From 7ac0862287270fcb0cfb33b01a31ae2e650621ef Mon Sep 17 00:00:00 2001 From: Sree Charan Manamala Date: Thu, 20 Jun 2024 15:05:58 +0530 Subject: [PATCH 01/72] Grouping Engine fix when a limit spec with different order by columns is applied (#16534) --- .../druid/query/groupby/GroupByQuery.java | 155 ++++++++---------- .../druid/query/groupby/GroupingEngine.java | 5 +- .../druid/sql/calcite/CalciteQueryTest.java | 31 +++- 3 files changed, 99 insertions(+), 92 deletions(-) diff --git a/processing/src/main/java/org/apache/druid/query/groupby/GroupByQuery.java b/processing/src/main/java/org/apache/druid/query/groupby/GroupByQuery.java index cdcf9e3daf4..994705f55e3 100644 --- a/processing/src/main/java/org/apache/druid/query/groupby/GroupByQuery.java +++ b/processing/src/main/java/org/apache/druid/query/groupby/GroupByQuery.java @@ -560,15 +560,20 @@ public class GroupByQuery extends BaseQuery return false; } - /** - * When limit push down is applied, the partial results would be sorted by the ordering specified by the - * limit/order spec (unlike non-push down case where the results always use the default natural ascending order), - * so when merging these partial result streams, the merge needs to use the same ordering to get correct results. - */ - private Ordering getRowOrderingForPushDown( - final boolean granular, - final DefaultLimitSpec limitSpec - ) + public Ordering getRowOrdering(final boolean granular) + { + return getOrderingAndDimensions(granular).getRowOrdering(); + } + + public List getDimensionNamesInOrder() + { + return getOrderingAndDimensions(false).getDimensions() + .stream() + .map(DimensionSpec::getOutputName) + .collect(Collectors.toList()); + } + + public OrderingAndDimensions getOrderingAndDimensions(final boolean granular) { final boolean sortByDimsFirst = getContextSortByDimsFirst(); @@ -577,18 +582,30 @@ public class GroupByQuery extends BaseQuery final List needsReverseList = new ArrayList<>(); final List dimensionTypes = new ArrayList<>(); final List comparators = new ArrayList<>(); + final List dimensionsInOrder = new ArrayList<>(); - for (OrderByColumnSpec orderSpec : limitSpec.getColumns()) { - boolean needsReverse = orderSpec.getDirection() != OrderByColumnSpec.Direction.ASCENDING; - int dimIndex = OrderByColumnSpec.getDimIndexForOrderBy(orderSpec, dimensions); - if (dimIndex >= 0) { - DimensionSpec dim = dimensions.get(dimIndex); - orderedFieldNumbers.add(resultRowSignature.indexOf(dim.getOutputName())); - dimsInOrderBy.add(dimIndex); - needsReverseList.add(needsReverse); - final ColumnType type = dimensions.get(dimIndex).getOutputType(); - dimensionTypes.add(type); - comparators.add(orderSpec.getDimensionComparator()); + /* + * When limit push down is applied, the partial results would be sorted by the ordering specified by the + * limit/order spec (unlike non-push down case where the results always use the default natural ascending order), + * so when merging these partial result streams, the merge needs to use the same ordering to get correct results. 
+ */ + if (isApplyLimitPushDown()) { + DefaultLimitSpec limitSpec1 = (DefaultLimitSpec) limitSpec; + if (!DefaultLimitSpec.sortingOrderHasNonGroupingFields(limitSpec1, dimensions)) { + for (OrderByColumnSpec orderSpec : ((DefaultLimitSpec) limitSpec).getColumns()) { + boolean needsReverse = orderSpec.getDirection() != OrderByColumnSpec.Direction.ASCENDING; + int dimIndex = OrderByColumnSpec.getDimIndexForOrderBy(orderSpec, dimensions); + if (dimIndex >= 0) { + DimensionSpec dim = dimensions.get(dimIndex); + orderedFieldNumbers.add(resultRowSignature.indexOf(dim.getOutputName())); + dimsInOrderBy.add(dimIndex); + needsReverseList.add(needsReverse); + final ColumnType type = dimensions.get(dimIndex).getOutputType(); + dimensionTypes.add(type); + comparators.add(orderSpec.getDimensionComparator()); + dimensionsInOrder.add(dim); + } + } } } @@ -599,14 +616,16 @@ public class GroupByQuery extends BaseQuery final ColumnType type = dimensions.get(i).getOutputType(); dimensionTypes.add(type); comparators.add(StringComparators.NATURAL); + dimensionsInOrder.add(dimensions.get(i)); } } final Comparator timeComparator = getTimeComparator(granular); + Ordering ordering; if (timeComparator == null) { - return Ordering.from( - (lhs, rhs) -> compareDimsForLimitPushDown( + ordering = Ordering.from( + (lhs, rhs) -> compareDims( orderedFieldNumbers, needsReverseList, dimensionTypes, @@ -616,9 +635,9 @@ public class GroupByQuery extends BaseQuery ) ); } else if (sortByDimsFirst) { - return Ordering.from( + ordering = Ordering.from( (lhs, rhs) -> { - final int cmp = compareDimsForLimitPushDown( + final int cmp = compareDims( orderedFieldNumbers, needsReverseList, dimensionTypes, @@ -634,7 +653,7 @@ public class GroupByQuery extends BaseQuery } ); } else { - return Ordering.from( + ordering = Ordering.from( (lhs, rhs) -> { final int timeCompare = timeComparator.compare(lhs, rhs); @@ -642,7 +661,7 @@ public class GroupByQuery extends BaseQuery return timeCompare; } - return compareDimsForLimitPushDown( + return compareDims( orderedFieldNumbers, needsReverseList, dimensionTypes, @@ -653,45 +672,8 @@ public class GroupByQuery extends BaseQuery } ); } - } - public Ordering getRowOrdering(final boolean granular) - { - if (isApplyLimitPushDown()) { - if (!DefaultLimitSpec.sortingOrderHasNonGroupingFields((DefaultLimitSpec) limitSpec, dimensions)) { - return getRowOrderingForPushDown(granular, (DefaultLimitSpec) limitSpec); - } - } - - final boolean sortByDimsFirst = getContextSortByDimsFirst(); - final Comparator timeComparator = getTimeComparator(granular); - - if (timeComparator == null) { - return Ordering.from((lhs, rhs) -> compareDims(dimensions, lhs, rhs)); - } else if (sortByDimsFirst) { - return Ordering.from( - (lhs, rhs) -> { - final int cmp = compareDims(dimensions, lhs, rhs); - if (cmp != 0) { - return cmp; - } - - return timeComparator.compare(lhs, rhs); - } - ); - } else { - return Ordering.from( - (lhs, rhs) -> { - final int timeCompare = timeComparator.compare(lhs, rhs); - - if (timeCompare != 0) { - return timeCompare; - } - - return compareDims(dimensions, lhs, rhs); - } - ); - } + return new OrderingAndDimensions(ordering, dimensionsInOrder); } @Nullable @@ -716,25 +698,6 @@ public class GroupByQuery extends BaseQuery } } - private int compareDims(List dimensions, ResultRow lhs, ResultRow rhs) - { - final int dimensionStart = getResultRowDimensionStart(); - - for (int i = 0; i < dimensions.size(); i++) { - DimensionSpec dimension = dimensions.get(i); - final int dimCompare = 
DimensionHandlerUtils.compareObjectsAsType( - lhs.get(dimensionStart + i), - rhs.get(dimensionStart + i), - dimension.getOutputType() - ); - if (dimCompare != 0) { - return dimCompare; - } - } - - return 0; - } - /** * Computes the timestamp that will be returned by {@link #getUniversalTimestamp()}. */ @@ -760,12 +723,12 @@ public class GroupByQuery extends BaseQuery } /** - * Compares the dimensions for limit pushdown. + * Compares the dimensions. * * Due to legacy reason, the provided StringComparator for the arrays isn't applied and must be changed once we * get rid of the StringComparators for array types */ - private static int compareDimsForLimitPushDown( + private static int compareDims( final IntList fields, final List needsReverseList, final List dimensionTypes, @@ -924,6 +887,28 @@ public class GroupByQuery extends BaseQuery } } + public static class OrderingAndDimensions + { + Ordering rowOrdering; + List dimensions; + + public OrderingAndDimensions(Ordering rowOrdering, List dimensions) + { + this.rowOrdering = rowOrdering; + this.dimensions = dimensions; + } + + public Ordering getRowOrdering() + { + return rowOrdering; + } + + public List getDimensions() + { + return dimensions; + } + } + public static class Builder { @Nullable diff --git a/processing/src/main/java/org/apache/druid/query/groupby/GroupingEngine.java b/processing/src/main/java/org/apache/druid/query/groupby/GroupingEngine.java index 6451fb9b943..ab1ee1052b4 100644 --- a/processing/src/main/java/org/apache/druid/query/groupby/GroupingEngine.java +++ b/processing/src/main/java/org/apache/druid/query/groupby/GroupingEngine.java @@ -686,8 +686,7 @@ public class GroupingEngine processingConfig.intermediateComputeSizeBytes() ); - List queryDimNames = baseSubtotalQuery.getDimensions().stream().map(DimensionSpec::getOutputName) - .collect(Collectors.toList()); + List queryDimNamesInOrder = baseSubtotalQuery.getDimensionNamesInOrder(); // Only needed to make LimitSpec.filterColumns(..) call later in case base query has a non default LimitSpec. Set aggsAndPostAggs = null; @@ -724,7 +723,7 @@ public class GroupingEngine .withLimitSpec(subtotalQueryLimitSpec); final GroupByRowProcessor.ResultSupplier resultSupplierOneFinal = resultSupplierOne; - if (Utils.isPrefix(subtotalSpec, queryDimNames)) { + if (Utils.isPrefix(subtotalSpec, queryDimNamesInOrder)) { // Since subtotalSpec is a prefix of base query dimensions, so results from base query are also sorted // by subtotalSpec as needed by stream merging. 
subtotalsResults.add( diff --git a/sql/src/test/java/org/apache/druid/sql/calcite/CalciteQueryTest.java b/sql/src/test/java/org/apache/druid/sql/calcite/CalciteQueryTest.java index 1975f5589e6..9a0a0318210 100644 --- a/sql/src/test/java/org/apache/druid/sql/calcite/CalciteQueryTest.java +++ b/sql/src/test/java/org/apache/druid/sql/calcite/CalciteQueryTest.java @@ -13823,10 +13823,8 @@ public class CalciteQueryTest extends BaseCalciteQueryTest .build() ), ImmutableList.builder().add( - new Object[]{"", null, 2L}, - new Object[]{"a", null, 1L}, - new Object[]{"", null, 1L}, - new Object[]{"a", null, 1L}, + new Object[]{"", null, 3L}, + new Object[]{"a", null, 2L}, new Object[]{"abc", null, 1L}, new Object[]{NULL_STRING, null, 6L}, new Object[]{"", timestamp("2000-01-01"), 2L}, @@ -16290,4 +16288,29 @@ public class CalciteQueryTest extends BaseCalciteQueryTest ) ).run(); } + + @SqlTestFrameworkConfig.NumMergeBuffers(3) + @Test + public void testGroupingSetsWithDifferentOrderLimitSpec() + { + msqIncompatible(); + testBuilder() + .sql( + "SELECT\n" + + " isNew, isRobot, COUNT(*) AS \"Cnt\"\n" + + "FROM \"wikipedia\"\n" + + "GROUP BY GROUPING SETS ((isRobot), (isNew))\n" + + "ORDER BY 2, 1\n" + + "limit 100" + ) + .expectedResults( + ResultMatchMode.RELAX_NULLS, + ImmutableList.of( + new Object[]{"false", null, 36966L}, + new Object[]{"true", null, 2278L}, + new Object[]{null, "false", 23824L}, + new Object[]{null, "true", 15420L} + ) + ).run(); + } } From b20c3dbadfe299a8d4715d4ecc924ccfab432fc0 Mon Sep 17 00:00:00 2001 From: Abhishek Radhakrishnan Date: Thu, 20 Jun 2024 08:40:28 -0700 Subject: [PATCH 02/72] Fix malformed period throwing `ADMIN` persona error (#16626) * Turn invalid periods into user-facing exception providing more context. The current exception is targeting the ADMIN persona. Catch that and turn it into a USER persona instead. Also, provide more context in the error message. * Review comment: pass the wrapping expression and stringify. 
* Update processing/src/main/java/org/apache/druid/query/expression/ExprUtils.java Co-authored-by: Clint Wylie --------- Co-authored-by: Clint Wylie --- .../druid/query/expression/ExprUtils.java | 17 ++++++++++++-- .../expression/TimestampCeilExprMacro.java | 11 ++++++--- .../expression/TimestampFloorExprMacro.java | 11 ++++++--- .../sql/calcite/planner/CalcitePlanner.java | 2 +- .../sql/calcite/CalciteSelectQueryTest.java | 23 +++++++++++++++++++ 5 files changed, 55 insertions(+), 9 deletions(-) diff --git a/processing/src/main/java/org/apache/druid/query/expression/ExprUtils.java b/processing/src/main/java/org/apache/druid/query/expression/ExprUtils.java index e2bd808d7b9..be513b40248 100644 --- a/processing/src/main/java/org/apache/druid/query/expression/ExprUtils.java +++ b/processing/src/main/java/org/apache/druid/query/expression/ExprUtils.java @@ -20,6 +20,7 @@ package org.apache.druid.query.expression; import org.apache.druid.common.config.NullHandling; +import org.apache.druid.error.InvalidInput; import org.apache.druid.java.util.common.DateTimes; import org.apache.druid.java.util.common.IAE; import org.apache.druid.java.util.common.granularity.PeriodGranularity; @@ -45,13 +46,25 @@ public class ExprUtils } static PeriodGranularity toPeriodGranularity( + final Expr wrappingExpr, final Expr periodArg, @Nullable final Expr originArg, @Nullable final Expr timeZoneArg, final Expr.ObjectBinding bindings ) { - final Period period = new Period(periodArg.eval(bindings).asString()); + final Period period; + try { + period = new Period(periodArg.eval(bindings).asString()); + } + catch (IllegalArgumentException iae) { + throw InvalidInput.exception( + "Invalid period[%s] specified for expression[%s]: [%s]", + periodArg.stringify(), + wrappingExpr.stringify(), + iae.getMessage() + ); + } final DateTime origin; final DateTimeZone timeZone; @@ -69,7 +82,7 @@ public class ExprUtils final Object value = originArg.eval(bindings).valueOrDefault(); if (value instanceof String && NullHandling.isNullOrEquivalent((String) value)) { // We get a blank string here, when sql compatible null handling is enabled - // and expression contains empty string for for origin + // and expression contains empty string for origin // e.g timestamp_floor(\"__time\",'PT1M','','UTC') origin = null; } else { diff --git a/processing/src/main/java/org/apache/druid/query/expression/TimestampCeilExprMacro.java b/processing/src/main/java/org/apache/druid/query/expression/TimestampCeilExprMacro.java index cfd63f1ea61..3c5102ae7a2 100644 --- a/processing/src/main/java/org/apache/druid/query/expression/TimestampCeilExprMacro.java +++ b/processing/src/main/java/org/apache/druid/query/expression/TimestampCeilExprMacro.java @@ -63,7 +63,7 @@ public class TimestampCeilExprMacro implements ExprMacroTable.ExprMacro TimestampCeilExpr(final TimestampCeilExprMacro macro, final List args) { super(macro, args); - this.granularity = getGranularity(args, InputBindings.nilBindings()); + this.granularity = getGranularity(this, args, InputBindings.nilBindings()); } @Nonnull @@ -113,9 +113,14 @@ public class TimestampCeilExprMacro implements ExprMacroTable.ExprMacro } } - private static PeriodGranularity getGranularity(final List args, final Expr.ObjectBinding bindings) + private static PeriodGranularity getGranularity( + final Expr expr, + final List args, + final Expr.ObjectBinding bindings + ) { return ExprUtils.toPeriodGranularity( + expr, args.get(1), args.size() > 2 ? args.get(2) : null, args.size() > 3 ? 
args.get(3) : null, @@ -135,7 +140,7 @@ public class TimestampCeilExprMacro implements ExprMacroTable.ExprMacro @Override public ExprEval eval(final ObjectBinding bindings) { - final PeriodGranularity granularity = getGranularity(args, bindings); + final PeriodGranularity granularity = getGranularity(this, args, bindings); long argTime = args.get(0).eval(bindings).asLong(); long bucketStartTime = granularity.bucketStart(argTime); if (argTime == bucketStartTime) { diff --git a/processing/src/main/java/org/apache/druid/query/expression/TimestampFloorExprMacro.java b/processing/src/main/java/org/apache/druid/query/expression/TimestampFloorExprMacro.java index a243273b8f0..02eed7327f1 100644 --- a/processing/src/main/java/org/apache/druid/query/expression/TimestampFloorExprMacro.java +++ b/processing/src/main/java/org/apache/druid/query/expression/TimestampFloorExprMacro.java @@ -56,9 +56,14 @@ public class TimestampFloorExprMacro implements ExprMacroTable.ExprMacro } } - private static PeriodGranularity computeGranularity(final List args, final Expr.ObjectBinding bindings) + private static PeriodGranularity computeGranularity( + final Expr expr, + final List args, + final Expr.ObjectBinding bindings + ) { return ExprUtils.toPeriodGranularity( + expr, args.get(1), args.size() > 2 ? args.get(2) : null, args.size() > 3 ? args.get(3) : null, @@ -73,7 +78,7 @@ public class TimestampFloorExprMacro implements ExprMacroTable.ExprMacro TimestampFloorExpr(final TimestampFloorExprMacro macro, final List args) { super(macro, args); - this.granularity = computeGranularity(args, InputBindings.nilBindings()); + this.granularity = computeGranularity(this, args, InputBindings.nilBindings()); } /** @@ -170,7 +175,7 @@ public class TimestampFloorExprMacro implements ExprMacroTable.ExprMacro @Override public ExprEval eval(final ObjectBinding bindings) { - final PeriodGranularity granularity = computeGranularity(args, bindings); + final PeriodGranularity granularity = computeGranularity(this, args, bindings); return ExprEval.of(granularity.bucketStart(args.get(0).eval(bindings).asLong())); } diff --git a/sql/src/main/java/org/apache/druid/sql/calcite/planner/CalcitePlanner.java b/sql/src/main/java/org/apache/druid/sql/calcite/planner/CalcitePlanner.java index 933baaac9ba..8eb9541961c 100644 --- a/sql/src/main/java/org/apache/druid/sql/calcite/planner/CalcitePlanner.java +++ b/sql/src/main/java/org/apache/druid/sql/calcite/planner/CalcitePlanner.java @@ -200,7 +200,7 @@ public class CalcitePlanner implements Planner, ViewExpander state = CalcitePlanner.State.STATE_2_READY; - // If user specify own traitDef, instead of default default trait, + // If user specifies own traitDef, instead of default trait, // register the trait def specified in traitDefs. 
if (this.traitDefs == null) { planner.addRelTraitDef(ConventionTraitDef.INSTANCE); diff --git a/sql/src/test/java/org/apache/druid/sql/calcite/CalciteSelectQueryTest.java b/sql/src/test/java/org/apache/druid/sql/calcite/CalciteSelectQueryTest.java index 3203ae9915e..d1f256207d5 100644 --- a/sql/src/test/java/org/apache/druid/sql/calcite/CalciteSelectQueryTest.java +++ b/sql/src/test/java/org/apache/druid/sql/calcite/CalciteSelectQueryTest.java @@ -22,6 +22,7 @@ package org.apache.druid.sql.calcite; import com.google.common.collect.ImmutableList; import com.google.common.collect.ImmutableMap; import org.apache.druid.common.config.NullHandling; +import org.apache.druid.error.DruidExceptionMatcher; import org.apache.druid.java.util.common.DateTimes; import org.apache.druid.java.util.common.Intervals; import org.apache.druid.java.util.common.granularity.Granularities; @@ -130,6 +131,28 @@ public class CalciteSelectQueryTest extends BaseCalciteQueryTest ); } + @Test + public void testTimeCeilExpressionContainingInvalidPeriod() + { + testQueryThrows( + "SELECT TIME_CEIL(__time, 'PT1Y') FROM foo", + DruidExceptionMatcher.invalidInput().expectMessageContains( + "Invalid period['PT1Y'] specified for expression[timestamp_ceil(\"__time\", 'PT1Y', null, 'UTC')]" + ) + ); + } + + @Test + public void testTimeFloorExpressionContainingInvalidPeriod() + { + testQueryThrows( + "SELECT TIME_FLOOR(TIMESTAMPADD(DAY, -1, __time), 'PT1D') FROM foo", + DruidExceptionMatcher.invalidInput().expectMessageContains( + "Invalid period['PT1D'] specified for expression[timestamp_floor((\"__time\" + -86400000), 'PT1D', null, 'UTC')]" + ) + ); + } + @Test public void testValuesContainingNull() { From ae70e18bc8e6caf57c6f469bc5cd971e69af6169 Mon Sep 17 00:00:00 2001 From: Andreas Maechler Date: Thu, 20 Jun 2024 10:31:29 -0600 Subject: [PATCH 03/72] docs: Update Azure extension (#16585) Co-authored-by: Victoria Lim --- docs/configuration/extensions.md | 6 +- docs/configuration/index.md | 22 +++--- docs/development/extensions-core/azure.md | 84 +++++++++++++++++----- docs/development/extensions-core/hdfs.md | 7 +- docs/development/extensions-core/s3.md | 29 ++++---- docs/ingestion/hadoop.md | 4 +- docs/ingestion/input-sources.md | 88 ++++++++++++----------- docs/ingestion/native-batch.md | 22 +++--- website/.spelling | 1 + 9 files changed, 161 insertions(+), 102 deletions(-) diff --git a/docs/configuration/extensions.md b/docs/configuration/extensions.md index 29356ebc05c..d396bc29000 100644 --- a/docs/configuration/extensions.md +++ b/docs/configuration/extensions.md @@ -22,7 +22,6 @@ title: "Extensions" ~ under the License. --> - Druid implements an extension system that allows for adding functionality at runtime. Extensions are commonly used to add support for deep storages (like HDFS and S3), metadata stores (like MySQL and PostgreSQL), new aggregators, new input formats, and so on. @@ -55,7 +54,7 @@ Core extensions are maintained by Druid committers. |druid-parquet-extensions|Support for data in Apache Parquet data format. 
Requires druid-avro-extensions to be loaded.|[link](../development/extensions-core/parquet.md)| |druid-protobuf-extensions| Support for data in Protobuf data format.|[link](../development/extensions-core/protobuf.md)| |druid-ranger-security|Support for access control through Apache Ranger.|[link](../development/extensions-core/druid-ranger-security.md)| -|druid-s3-extensions|Interfacing with data in AWS S3, and using S3 as deep storage.|[link](../development/extensions-core/s3.md)| +|druid-s3-extensions|Interfacing with data in Amazon S3, and using S3 as deep storage.|[link](../development/extensions-core/s3.md)| |druid-ec2-extensions|Interfacing with AWS EC2 for autoscaling middle managers|UNDOCUMENTED| |druid-aws-rds-extensions|Support for AWS token based access to AWS RDS DB Cluster.|[link](../development/extensions-core/druid-aws-rds.md)| |druid-stats|Statistics related module including variance and standard deviation.|[link](../development/extensions-core/stats.md)| @@ -101,7 +100,7 @@ All of these community extensions can be downloaded using [pull-deps](../operati |druid-momentsketch|Support for approximate quantile queries using the [momentsketch](https://github.com/stanford-futuredata/momentsketch) library|[link](../development/extensions-contrib/momentsketch-quantiles.md)| |druid-tdigestsketch|Support for approximate sketch aggregators based on [T-Digest](https://github.com/tdunning/t-digest)|[link](../development/extensions-contrib/tdigestsketch-quantiles.md)| |gce-extensions|GCE Extensions|[link](../development/extensions-contrib/gce-extensions.md)| -|prometheus-emitter|Exposes [Druid metrics](../operations/metrics.md) for Prometheus server collection (https://prometheus.io/)|[link](../development/extensions-contrib/prometheus.md)| +|prometheus-emitter|Exposes [Druid metrics](../operations/metrics.md) for Prometheus server collection ()|[link](../development/extensions-contrib/prometheus.md)| |druid-kubernetes-overlord-extensions|Support for launching tasks in k8s without Middle Managers|[link](../development/extensions-contrib/k8s-jobs.md)| |druid-spectator-histogram|Support for efficient approximate percentile queries|[link](../development/extensions-contrib/spectator-histogram.md)| |druid-rabbit-indexing-service|Support for creating and managing [RabbitMQ](https://www.rabbitmq.com/) indexing tasks|[link](../development/extensions-contrib/rabbit-stream-ingestion.md)| @@ -111,7 +110,6 @@ All of these community extensions can be downloaded using [pull-deps](../operati Please post on [dev@druid.apache.org](https://lists.apache.org/list.html?dev@druid.apache.org) if you'd like an extension to be promoted to core. If we see a community extension actively supported by the community, we can promote it to core based on community feedback. - For information how to create your own extension, please see [here](../development/modules.md). ## Loading extensions diff --git a/docs/configuration/index.md b/docs/configuration/index.md index 4eceec8beec..b62ab9c0db8 100644 --- a/docs/configuration/index.md +++ b/docs/configuration/index.md @@ -668,14 +668,12 @@ Store task logs in S3. Note that the `druid-s3-extensions` extension must be loa ##### Azure Blob Store task logs -Store task logs in Azure Blob Store. +Store task logs in Azure Blob Store. To enable this feature, load the `druid-azure-extensions` extension, and configure deep storage for Azure. 
Druid uses the same authentication method configured for deep storage and stores task logs in the same storage account (set in `druid.azure.account`). -Note: The `druid-azure-extensions` extension must be loaded, and this uses the same storage account as the deep storage module for azure. - -|Property|Description|Default| -|--------|-----------|-------| -|`druid.indexer.logs.container`|The Azure Blob Store container to write logs to|none| -|`druid.indexer.logs.prefix`|The path to prepend to logs|none| +| Property | Description | Default | +|---|---|---| +| `druid.indexer.logs.container` | The Azure Blob Store container to write logs to. | Must be set. | +| `druid.indexer.logs.prefix` | The path to prepend to logs. | Must be set. | ##### Google Cloud Storage task logs @@ -714,7 +712,7 @@ You can configure Druid API error responses to hide internal information like th |`druid.server.http.showDetailedJettyErrors`|When set to true, any error from the Jetty layer / Jetty filter includes the following fields in the JSON response: `servlet`, `message`, `url`, `status`, and `cause`, if it exists. When set to false, the JSON response only includes `message`, `url`, and `status`. The field values remain unchanged.|true| |`druid.server.http.errorResponseTransform.strategy`|Error response transform strategy. The strategy controls how Druid transforms error responses from Druid services. When unset or set to `none`, Druid leaves error responses unchanged.|`none`| -##### Error response transform strategy +#### Error response transform strategy You can use an error response transform strategy to transform error responses from within Druid services to hide internal information. When you specify an error response transform strategy other than `none`, Druid transforms the error responses from Druid services as follows: @@ -723,12 +721,12 @@ When you specify an error response transform strategy other than `none`, Druid t * For any SQL query API that fails, for example `POST /druid/v2/sql/...`, Druid sets the fields `errorClass` and `host` to null. Druid applies the transformation strategy to the `errorMessage` field. * For any JDBC related exceptions, Druid will turn all checked exceptions into `QueryInterruptedException` otherwise druid will attempt to keep the exception as the same type. For example if the original exception isn't owned by Druid it will become `QueryInterruptedException`. Druid applies the transformation strategy to the `errorMessage` field. -###### No error response transform strategy +##### No error response transform strategy In this mode, Druid leaves error responses from underlying services unchanged and returns the unchanged errors to the API client. This is the default Druid error response mode. To explicitly enable this strategy, set `druid.server.http.errorResponseTransform.strategy` to `none`. -###### Allowed regular expression error response transform strategy +##### Allowed regular expression error response transform strategy In this mode, Druid validates the error responses from underlying services against a list of regular expressions. Only error messages that match a configured regular expression are returned. To enable this strategy, set `druid.server.http.errorResponseTransform.strategy` to `allowedRegex`. @@ -774,7 +772,7 @@ This config is used to find the [Coordinator](../design/coordinator.md) using Cu You can configure how to announce and unannounce Znodes in ZooKeeper (using Curator). For normal operations you do not need to override any of these configs. 
-##### Batch data segment announcer +#### Batch data segment announcer In current Druid, multiple data segments may be announced under the same Znode. @@ -2037,7 +2035,7 @@ A simple in-memory LRU cache. Local cache resides in JVM heap memory, so if you |Property|Description|Default| |--------|-----------|-------| |`druid.cache.sizeInBytes`|Maximum cache size in bytes. Zero disables caching.|0| -|`druid.cache.initialSize`|Initial size of the hashtable backing the cache.|500000| +|`druid.cache.initialSize`|Initial size of the hash table backing the cache.|500000| |`druid.cache.logEvictionCount`|If non-zero, log cache eviction every `logEvictionCount` items.|0| #### Caffeine cache diff --git a/docs/development/extensions-core/azure.md b/docs/development/extensions-core/azure.md index 21e24153a47..d6310e32cf9 100644 --- a/docs/development/extensions-core/azure.md +++ b/docs/development/extensions-core/azure.md @@ -22,25 +22,75 @@ title: "Microsoft Azure" ~ under the License. --> +## Azure extension + +This extension allows you to do the following: + +* [Ingest data](#ingest-data-from-azure) from objects stored in Azure Blob Storage. +* [Write segments](#store-segments-in-azure) to Azure Blob Storage for deep storage. +* [Persist task logs](#persist-task-logs-in-azure) to Azure Blob Storage for long-term storage. + +:::info To use this Apache Druid extension, [include](../../configuration/extensions.md#loading-extensions) `druid-azure-extensions` in the extensions load list. -## Deep Storage +::: -[Microsoft Azure Storage](http://azure.microsoft.com/en-us/services/storage/) is another option for deep storage. This requires some additional Druid configuration. +### Ingest data from Azure -|Property|Description|Possible Values|Default| -|--------|---------------|-----------|-------| -|`druid.storage.type`|azure||Must be set.| -|`druid.azure.account`||Azure Storage account name.|Must be set.| -|`druid.azure.key`||Azure Storage account key.|Optional. Set one of key, sharedAccessStorageToken or useAzureCredentialsChain.| -|`druid.azure.sharedAccessStorageToken`||Azure Shared Storage access token|Optional. Set one of key, sharedAccessStorageToken or useAzureCredentialsChain..| -|`druid.azure.useAzureCredentialsChain`|Use [DefaultAzureCredential](https://learn.microsoft.com/en-us/java/api/overview/azure/identity-readme?view=azure-java-stable) for authentication|Optional. Set one of key, sharedAccessStorageToken or useAzureCredentialsChain.|False| -|`druid.azure.managedIdentityClientId`|If you want to use managed identity authentication in the `DefaultAzureCredential`, `useAzureCredentialsChain` must be true.||Optional.| -|`druid.azure.container`||Azure Storage container name.|Must be set.| -|`druid.azure.prefix`|A prefix string that will be prepended to the blob names for the segments published to Azure deep storage| |""| -|`druid.azure.protocol`|the protocol to use|http or https|https| -|`druid.azure.maxTries`|Number of tries before canceling an Azure operation.| |3| -|`druid.azure.maxListingLength`|maximum number of input files matching a given prefix to retrieve at a time| |1024| -|`druid.azure.storageAccountEndpointSuffix`| The endpoint suffix to use. Use this config instead of `druid.azure.endpointSuffix`. Override the default value to connect to [Azure Government](https://learn.microsoft.com/en-us/azure/azure-government/documentation-government-get-started-connect-to-storage#getting-started-with-storage-api). 
This config supports storage accounts enabled for [AzureDNSZone](https://learn.microsoft.com/en-us/azure/dns/dns-getstarted-portal). Note: do not include the storage account name prefix in this config value. | Examples: `ABCD1234.blob.storage.azure.net`, `blob.core.usgovcloudapi.net`| `blob.core.windows.net`| -See [Azure Services](http://azure.microsoft.com/en-us/pricing/free-trial/) for more information. +Ingest data using either [MSQ](../../multi-stage-query/index.md) or a native batch [parallel task](../../ingestion/native-batch.md) with an [Azure input source](../../ingestion/input-sources.md#azure-input-source) (`azureStorage`) to read objects directly from Azure Blob Storage. + +### Store segments in Azure + +:::info + +To use Azure for deep storage, set `druid.storage.type=azure`. + +::: + +#### Configure location + +Configure where to store segments using the following properties: + +| Property | Description | Default | +|---|---|---| +| `druid.azure.account` | The Azure Storage account name. | Must be set. | +| `druid.azure.container` | The Azure Storage container name. | Must be set. | +| `druid.azure.prefix` | A prefix string that will be prepended to the blob names for the segments published. | "" | +| `druid.azure.maxTries` | Number of tries before canceling an Azure operation. | 3 | +| `druid.azure.protocol` | The protocol to use to connect to the Azure Storage account. Either `http` or `https`. | `https` | +| `druid.azure.storageAccountEndpointSuffix` | The Storage account endpoint to use. Override the default value to connect to [Azure Government](https://learn.microsoft.com/en-us/azure/azure-government/documentation-government-get-started-connect-to-storage#getting-started-with-storage-api) or storage accounts with [Azure DNS zone endpoints](https://learn.microsoft.com/en-us/azure/storage/common/storage-account-overview#azure-dns-zone-endpoints-preview).

Do _not_ include the storage account name prefix in this config value.

Examples: `ABCD1234.blob.storage.azure.net`, `blob.core.usgovcloudapi.net`. | `blob.core.windows.net` | + +#### Configure authentication + +Authenticate access to Azure Blob Storage using one of the following methods: + +* [SAS token](https://learn.microsoft.com/en-us/azure/storage/common/storage-sas-overview) +* [Shared Key](https://learn.microsoft.com/en-us/rest/api/storageservices/authorize-with-shared-key) +* Default Azure credentials chain ([`DefaultAzureCredential`](https://learn.microsoft.com/en-us/java/api/overview/azure/identity-readme#defaultazurecredential)). + +Configure authentication using the following properties: + +| Property | Description | Default | +|---|---|---| +| `druid.azure.sharedAccessStorageToken` | The SAS (Shared Storage Access) token. | | +| `druid.azure.key` | The Shared Key. | | +| `druid.azure.useAzureCredentialsChain` | If `true`, use `DefaultAzureCredential` for authentication. | `false` | +| `druid.azure.managedIdentityClientId` | To use managed identity authentication in the `DefaultAzureCredential`, set `useAzureCredentialsChain` to `true` and provide the client ID here. | | + +### Persist task logs in Azure + +:::info + +To persist task logs in Azure Blob Storage, set `druid.indexer.logs.type=azure`. + +::: + +Druid stores task logs using the storage account and authentication method configured for storing segments. Use the following configuration to set up where to store the task logs: + +| Property | Description | Default | +|---|---|---| +| `druid.indexer.logs.container` | The Azure Blob Store container to write logs to. | Must be set. | +| `druid.indexer.logs.prefix` | The path to prepend to logs. | Must be set. | + +For general options regarding task retention, see [Log retention policy](../../configuration/index.md#log-retention-policy). diff --git a/docs/development/extensions-core/hdfs.md b/docs/development/extensions-core/hdfs.md index 32ef6133a9d..b1d2d0ceaab 100644 --- a/docs/development/extensions-core/hdfs.md +++ b/docs/development/extensions-core/hdfs.md @@ -22,7 +22,6 @@ title: "HDFS" ~ under the License. --> - To use this Apache Druid extension, [include](../../configuration/extensions.md#loading-extensions) `druid-hdfs-storage` in the extensions load list and run druid processes with `GOOGLE_APPLICATION_CREDENTIALS=/path/to/service_account_keyfile` in the environment. ## Deep Storage @@ -44,11 +43,11 @@ If you want to eagerly authenticate against a secured hadoop/hdfs cluster you mu ### Configuration for Cloud Storage -You can also use the AWS S3 or the Google Cloud Storage as the deep storage via HDFS. +You can also use the Amazon S3 or the Google Cloud Storage as the deep storage via HDFS. -#### Configuration for AWS S3 +#### Configuration for Amazon S3 -To use the AWS S3 as the deep storage, you need to configure `druid.storage.storageDirectory` properly. +To use the Amazon S3 as the deep storage, you need to configure `druid.storage.storageDirectory` properly. |Property|Possible Values|Description|Default| |--------|---------------|-----------|-------| diff --git a/docs/development/extensions-core/s3.md b/docs/development/extensions-core/s3.md index 20bd1682f24..ab8745f6e3b 100644 --- a/docs/development/extensions-core/s3.md +++ b/docs/development/extensions-core/s3.md @@ -25,6 +25,7 @@ title: "S3-compatible" ## S3 extension This extension allows you to do 2 things: + * [Ingest data](#reading-data-from-s3) from files stored in S3. * Write segments to [deep storage](#deep-storage) in S3. 
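For the ingestion side, a minimal `s3` input source inside a parallel task `ioConfig` could look like the sketch below. This is an illustration only: the bucket and object key are placeholders, not values taken from this patch, and the full set of options (`uris`, `prefixes`, `objects`, credentials) is described in the S3 input source documentation referenced above.

```json
    "ioConfig": {
      "type": "index_parallel",
      "inputSource": {
        "type": "s3",
        "uris": ["s3://your-bucket/path/to/file.json"]
      },
      "inputFormat": {
        "type": "json"
      }
    }
```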
@@ -41,7 +42,7 @@ To read objects from S3, you must supply [connection information](#configuration ### Deep Storage -S3-compatible deep storage means either AWS S3 or a compatible service like Google Storage which exposes the same API as S3. +S3-compatible deep storage means either Amazon S3 or a compatible service like Google Storage which exposes the same API as S3. S3 deep storage needs to be explicitly enabled by setting `druid.storage.type=s3`. **Only after setting the storage type to S3 will any of the settings below take effect.** @@ -97,19 +98,19 @@ Note that this setting only affects Druid's behavior. Changing S3 to use Object If you're using ACLs, Druid needs the following permissions: -- `s3:GetObject` -- `s3:PutObject` -- `s3:DeleteObject` -- `s3:GetBucketAcl` -- `s3:PutObjectAcl` +* `s3:GetObject` +* `s3:PutObject` +* `s3:DeleteObject` +* `s3:GetBucketAcl` +* `s3:PutObjectAcl` #### Object Ownership permissions If you're using Object Ownership, Druid needs the following permissions: -- `s3:GetObject` -- `s3:PutObject` -- `s3:DeleteObject` +* `s3:GetObject` +* `s3:PutObject` +* `s3:DeleteObject` ### AWS region @@ -117,8 +118,8 @@ The AWS SDK requires that a target region be specified. You can set these by us For example, to set the region to 'us-east-1' through system properties: -- Add `-Daws.region=us-east-1` to the `jvm.config` file for all Druid services. -- Add `-Daws.region=us-east-1` to `druid.indexer.runner.javaOpts` in [Middle Manager configuration](../../configuration/index.md#middlemanager-configuration) so that the property will be passed to Peon (worker) processes. +* Add `-Daws.region=us-east-1` to the `jvm.config` file for all Druid services. +* Add `-Daws.region=us-east-1` to `druid.indexer.runner.javaOpts` in [Middle Manager configuration](../../configuration/index.md#middlemanager-configuration) so that the property will be passed to Peon (worker) processes. ### Connecting to S3 configuration @@ -146,6 +147,6 @@ For example, to set the region to 'us-east-1' through system properties: You can enable [server-side encryption](https://docs.aws.amazon.com/AmazonS3/latest/dev/serv-side-encryption) by setting `druid.storage.sse.type` to a supported type of server-side encryption. 
The current supported types are: -- s3: [Server-side encryption with S3-managed encryption keys](https://docs.aws.amazon.com/AmazonS3/latest/dev/UsingServerSideEncryption) -- kms: [Server-side encryption with AWS KMS–Managed Keys](https://docs.aws.amazon.com/AmazonS3/latest/dev/UsingKMSEncryption) -- custom: [Server-side encryption with Customer-Provided Encryption Keys](https://docs.aws.amazon.com/AmazonS3/latest/dev/ServerSideEncryptionCustomerKeys) +* s3: [Server-side encryption with S3-managed encryption keys](https://docs.aws.amazon.com/AmazonS3/latest/dev/UsingServerSideEncryption) +* kms: [Server-side encryption with AWS KMS–Managed Keys](https://docs.aws.amazon.com/AmazonS3/latest/dev/UsingKMSEncryption) +* custom: [Server-side encryption with Customer-Provided Encryption Keys](https://docs.aws.amazon.com/AmazonS3/latest/dev/ServerSideEncryptionCustomerKeys) diff --git a/docs/ingestion/hadoop.md b/docs/ingestion/hadoop.md index c34fdb92117..96373e27517 100644 --- a/docs/ingestion/hadoop.md +++ b/docs/ingestion/hadoop.md @@ -148,7 +148,7 @@ For example, using the static input paths: "paths" : "hdfs://path/to/data/is/here/data.gz,hdfs://path/to/data/is/here/moredata.gz,hdfs://path/to/data/is/here/evenmoredata.gz" ``` -You can also read from cloud storage such as AWS S3 or Google Cloud Storage. +You can also read from cloud storage such as Amazon S3 or Google Cloud Storage. To do so, you need to install the necessary library under Druid's classpath in _all MiddleManager or Indexer processes_. For S3, you can run the below command to install the [Hadoop AWS module](https://hadoop.apache.org/docs/stable/hadoop-aws/tools/hadoop-aws/). @@ -336,7 +336,7 @@ The tuningConfig is optional and default parameters will be used if no tuningCon |logParseExceptions|Boolean|If true, log an error message when a parsing exception occurs, containing information about the row where the error occurred.|no(default = false)| |maxParseExceptions|Integer|The maximum number of parse exceptions that can occur before the task halts ingestion and fails. Overrides `ignoreInvalidRows` if `maxParseExceptions` is defined.|no(default = unlimited)| |useYarnRMJobStatusFallback|Boolean|If the Hadoop jobs created by the indexing task are unable to retrieve their completion status from the JobHistory server, and this parameter is true, the indexing task will try to fetch the application status from `http:///ws/v1/cluster/apps/`, where `` is the value of `yarn.resourcemanager.webapp.address` in your Hadoop configuration. This flag is intended as a fallback for cases where an indexing task's jobs succeed, but the JobHistory server is unavailable, causing the indexing task to fail because it cannot determine the job statuses.|no (default = true)| -|awaitSegmentAvailabilityTimeoutMillis|Long|Milliseconds to wait for the newly indexed segments to become available for query after ingestion completes. If `<= 0`, no wait will occur. If `> 0`, the task will wait for the Coordinator to indicate that the new segments are available for querying. If the timeout expires, the task will exit as successful, but the segments were not confirmed to have become available for query.|no (default = 0)| +|awaitSegmentAvailabilityTimeoutMillis|Long|Milliseconds to wait for the newly indexed segments to become available for query after ingestion completes. If `<= 0`, no wait will occur. If `> 0`, the task will wait for the Coordinator to indicate that the new segments are available for querying. 
If the timeout expires, the task will exit as successful, but the segments were not confirmed to have become available for query.|no (default = 0)| ### `jobProperties` diff --git a/docs/ingestion/input-sources.md b/docs/ingestion/input-sources.md index f89693740c8..fb8e1f98c91 100644 --- a/docs/ingestion/input-sources.md +++ b/docs/ingestion/input-sources.md @@ -30,12 +30,15 @@ For general information on native batch indexing and parallel task indexing, see ## S3 input source :::info - You need to include the [`druid-s3-extensions`](../development/extensions-core/s3.md) as an extension to use the S3 input source. + +You need to include the [`druid-s3-extensions`](../development/extensions-core/s3.md) as an extension to use the S3 input source. + ::: The S3 input source reads objects directly from S3. You can specify either: -- a list of S3 URI strings -- a list of S3 location prefixes that attempts to list the contents and ingest + +* a list of S3 URI strings +* a list of S3 location prefixes that attempts to list the contents and ingest all objects contained within the locations. The S3 input source is splittable. Therefore, you can use it with the [Parallel task](./native-batch.md). Each worker task of `index_parallel` reads one or multiple objects. @@ -76,7 +79,6 @@ Sample specs: ... ``` - ```json ... "ioConfig": { @@ -210,13 +212,17 @@ Properties Object: |assumeRoleExternalId|A unique identifier that might be required when you assume a role in another account [see](https://docs.aws.amazon.com/IAM/latest/UserGuide/id_credentials_temp_request.html)|None|no| :::info - **Note:** If `accessKeyId` and `secretAccessKey` are not given, the default [S3 credentials provider chain](../development/extensions-core/s3.md#s3-authentication-methods) is used. + +If `accessKeyId` and `secretAccessKey` are not given, the default [S3 credentials provider chain](../development/extensions-core/s3.md#s3-authentication-methods) is used. + ::: ## Google Cloud Storage input source :::info - You need to include the [`druid-google-extensions`](../development/extensions-core/google.md) as an extension to use the Google Cloud Storage input source. + +You need to include the [`druid-google-extensions`](../development/extensions-core/google.md) as an extension to use the Google Cloud Storage input source. + ::: The Google Cloud Storage input source is to support reading objects directly @@ -261,7 +267,6 @@ Sample specs: ... ``` - ```json ... "ioConfig": { @@ -300,16 +305,18 @@ Google Cloud Storage object: |path|The path where data is located.|None|yes| |systemFields|JSON array of system fields to return as part of input rows. Possible values: `__file_uri` (Google Cloud Storage URI starting with `gs://`), `__file_bucket` (GCS bucket), and `__file_path` (GCS key).|None|no| -## Azure input source +## Azure input source :::info - You need to include the [`druid-azure-extensions`](../development/extensions-core/azure.md) as an extension to use the Azure input source. + +You need to include the [`druid-azure-extensions`](../development/extensions-core/azure.md) as an extension to use the Azure input source. + ::: The Azure input source (that uses the type `azureStorage`) reads objects directly from Azure Blob store or Azure Data Lake sources. You can specify objects as a list of file URI strings or prefixes. You can split the Azure input source for use with [Parallel task](./native-batch.md) indexing and each worker task reads one chunk of the split data. 
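As a quick orientation before the full sample specs that follow, here is a minimal sketch of an `azureStorage` input source that combines a prefix listing, an `objectGlob`, and an inline `properties` override for SAS-token authentication. The storage account, container, and token shown are placeholders only; each field is documented in the tables below.

```json
    "inputSource": {
      "type": "azureStorage",
      "objectGlob": "**.json",
      "prefixes": ["azureStorage://storageAccount/container/prefix/"],
      "properties": {
        "sharedAccessStorageToken": "<SAS token>"
      }
    }
```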
-The `azureStorage` input source is a new schema for Azure input sources that allows you to specify which storage account files should be ingested from. We recommend that you update any specs that use the old `azure` schema to use the new `azureStorage` schema. The new schema provides more functionality than the older `azure` schema. +The `azureStorage` input source is a new schema for Azure input sources that allows you to specify which storage account files should be ingested from. We recommend that you update any specs that use the old `azure` schema to use the new `azureStorage` schema. The new schema provides more functionality than the older `azure` schema. Sample specs: @@ -347,7 +354,6 @@ Sample specs: ... ``` - ```json ... "ioConfig": { @@ -379,7 +385,7 @@ Sample specs: |objects|JSON array of Azure objects to ingest.|None|One of the following must be set:`uris`, `prefixes`, or `objects`.| |objectGlob|A glob for the object part of the Azure URI. In the URI `azureStorage://foo/bar/file.json`, the glob is applied to `bar/file.json`.

The glob must match the entire object part, not just the filename. For example, the glob `*.json` does not match `azureStorage://foo/bar/file.json` because the object part is `bar/file.json`, and the `*` does not match the slash. To match all objects ending in `.json`, use `**.json` instead.

For more information, refer to the documentation for [`FileSystem#getPathMatcher`](https://docs.oracle.com/javase/8/docs/api/java/nio/file/FileSystem.html#getPathMatcher-java.lang.String-).|None|no| |systemFields|JSON array of system fields to return as part of input rows. Possible values: `__file_uri` (Azure blob URI starting with `azureStorage://`), `__file_bucket` (Azure bucket), and `__file_path` (Azure object path).|None|no| -|properties|Properties object for overriding the default Azure configuration. See below for more information.|None|No (defaults will be used if not given) +|properties|Properties object for overriding the default Azure configuration. See below for more information.|None|No (defaults will be used if not given)| Note that the Azure input source skips all empty objects only when `prefixes` is specified. @@ -390,14 +396,12 @@ The `objects` property can one of the following: |bucket|Name of the Azure Blob Storage or Azure Data Lake storage account|None|yes| |path|The container and path where data is located.|None|yes| - The `properties` property can be one of the following: -- `sharedAccessStorageToken` -- `key` -- `appRegistrationClientId`, `appRegistrationClientSecret`, and `tenantId` -- empty - +* `sharedAccessStorageToken` +* `key` +* `appRegistrationClientId`, `appRegistrationClientSecret`, and `tenantId` +* empty |Property|Description|Default|Required| |--------|-----------|-------|---------| @@ -407,8 +411,7 @@ The `properties` property can be one of the following: |appRegistrationClientSecret|The client secret of the Azure App registration to authenticate as|None|Yes if `appRegistrationClientId` is provided| |tenantId|The tenant ID of the Azure App registration to authenticate as|None|Yes if `appRegistrationClientId` is provided| - -#### `azure` input source +### Legacy `azure` input source The Azure input source that uses the type `azure` is an older version of the Azure input type and is not recommended. It doesn't support specifying which storage account to ingest from. We recommend using the [`azureStorage` input source schema](#azure-input-source) instead since it provides more functionality. @@ -448,7 +451,6 @@ Sample specs: ... ``` - ```json ... "ioConfig": { @@ -487,11 +489,12 @@ The `objects` property is: |bucket|Name of the Azure Blob Storage or Azure Data Lake container|None|yes| |path|The path where data is located.|None|yes| - ## HDFS input source :::info - You need to include the [`druid-hdfs-storage`](../development/extensions-core/hdfs.md) as an extension to use the HDFS input source. + +You need to include the [`druid-hdfs-storage`](../development/extensions-core/hdfs.md) as an extension to use the HDFS input source. + ::: The HDFS input source is to support reading files directly @@ -580,10 +583,12 @@ in `druid.ingestion.hdfs.allowedProtocols`. See [HDFS input source security conf The HTTP input source is to support reading files directly from remote sites via HTTP. -:::info - **Security notes:** Ingestion tasks run under the operating system account that runs the Druid processes, for example the Indexer, Middle Manager, and Peon. This means any user who can submit an ingestion task can specify an input source referring to any location that the Druid process can access. For example, using `http` input source, users may have access to internal network servers. +:::info Security notes + +Ingestion tasks run under the operating system account that runs the Druid processes, for example the Indexer, Middle Manager, and Peon. 
This means any user who can submit an ingestion task can specify an input source referring to any location that the Druid process can access. For example, using `http` input source, users may have access to internal network servers. + +The `http` input source is not limited to the HTTP or HTTPS protocols. It uses the Java URI class that supports HTTP, HTTPS, FTP, file, and jar protocols by default. - The `http` input source is not limited to the HTTP or HTTPS protocols. It uses the Java URI class that supports HTTP, HTTPS, FTP, file, and jar protocols by default. ::: For more information about security best practices, see [Security overview](../operations/security-overview.md#best-practices). @@ -725,7 +730,7 @@ Sample spec: |filter|A wildcard filter for files. See [here](http://commons.apache.org/proper/commons-io/apidocs/org/apache/commons/io/filefilter/WildcardFileFilter) for more information. Files matching the filter criteria are considered for ingestion. Files not matching the filter criteria are ignored.|yes if `baseDir` is specified| |baseDir|Directory to search recursively for files to be ingested. Empty files under the `baseDir` will be skipped.|At least one of `baseDir` or `files` should be specified| |files|File paths to ingest. Some files can be ignored to avoid ingesting duplicate files if they are located under the specified `baseDir`. Empty files will be skipped.|At least one of `baseDir` or `files` should be specified| -|systemFields|JSON array of system fields to return as part of input rows. Possible values: `__file_uri` (File URI starting with `file:`) and `__file_path` (file path).|None|no| +|systemFields|JSON array of system fields to return as part of input rows. Possible values: `__file_uri` (File URI starting with `file:`) and `__file_path` (file path).|no| ## Druid input source @@ -744,9 +749,9 @@ no `inputFormat` field needs to be specified in the ingestion spec when using th The Druid input source can be used for a variety of purposes, including: -- Creating new datasources that are rolled-up copies of existing datasources. -- Changing the [partitioning or sorting](./partitioning.md) of a datasource to improve performance. -- Updating or removing rows using a [`transformSpec`](./ingestion-spec.md#transformspec). +* Creating new datasources that are rolled-up copies of existing datasources. +* Changing the [partitioning or sorting](./partitioning.md) of a datasource to improve performance. +* Updating or removing rows using a [`transformSpec`](./ingestion-spec.md#transformspec). When using the Druid input source, the timestamp column shows up as a numeric field named `__time` set to the number of milliseconds since the epoch (January 1, 1970 00:00:00 UTC). It is common to use this in the timestampSpec, if you @@ -813,16 +818,16 @@ rolled-up datasource `wikipedia_rollup` by grouping on hour, "countryName", and ``` :::info - Note: Older versions (0.19 and earlier) did not respect the timestampSpec when using the Druid input source. If you - have ingestion specs that rely on this and cannot rewrite them, set - [`druid.indexer.task.ignoreTimestampSpecForDruidInputSource`](../configuration/index.md#indexer-general-configuration) - to `true` to enable a compatibility mode where the timestampSpec is ignored. + +Older versions (0.19 and earlier) did not respect the timestampSpec when using the Druid input source. 
If you have ingestion specs that rely on this and cannot rewrite them, set [`druid.indexer.task.ignoreTimestampSpecForDruidInputSource`](../configuration/index.md#indexer-general-configuration) to `true` to enable a compatibility mode where the timestampSpec is ignored. + ::: The [secondary partitioning method](native-batch.md#partitionsspec) determines the requisite number of concurrent worker tasks that run in parallel to complete ingestion with the Combining input source. Set this value in `maxNumConcurrentSubTasks` in `tuningConfig` based on the secondary partitioning method: -- `range` or `single_dim` partitioning: greater than or equal to 1 -- `hashed` or `dynamic` partitioning: greater than or equal to 2 + +* `range` or `single_dim` partitioning: greater than or equal to 1 +* `hashed` or `dynamic` partitioning: greater than or equal to 2 For more information on the `maxNumConcurrentSubTasks` field, see [Implementation considerations](native-batch.md#implementation-considerations). @@ -866,7 +871,7 @@ The following is an example of an SQL input source spec: The spec above will read all events from two separate SQLs for the interval `2013-01-01/2013-01-02`. Each of the SQL queries will be run in its own sub-task and thus for the above example, there would be two sub-tasks. -**Recommended practices** +### Recommended practices Compared to the other native batch input sources, SQL input source behaves differently in terms of reading the input data. Therefore, consider the following points before using this input source in a production environment: @@ -878,7 +883,6 @@ Compared to the other native batch input sources, SQL input source behaves diffe * Similar to file-based input formats, any updates to existing data will replace the data in segments specific to the intervals specified in the `granularitySpec`. - ## Combining input source The Combining input source lets you read data from multiple input sources. @@ -928,7 +932,9 @@ The following is an example of a Combining input source spec: ## Iceberg input source :::info + To use the Iceberg input source, load the extension [`druid-iceberg-extensions`](../development/extensions-contrib/iceberg.md). + ::: You use the Iceberg input source to read data stored in the Iceberg table format. For a given table, the input source scans up to the latest Iceberg snapshot from the configured Hive catalog. Druid ingests the underlying live data files using the existing input source formats. @@ -1133,13 +1139,15 @@ This input source provides the following filters: `and`, `equals`, `interval`, a ## Delta Lake input source :::info + To use the Delta Lake input source, load the extension [`druid-deltalake-extensions`](../development/extensions-contrib/delta-lake.md). + ::: You can use the Delta input source to read data stored in a Delta Lake table. For a given table, the input source scans the latest snapshot from the configured table. Druid ingests the underlying delta files from the table. - | Property|Description|Required| +| Property|Description|Required| |---------|-----------|--------| | type|Set this value to `delta`.|yes| | tablePath|The location of the Delta table.|yes| @@ -1155,7 +1163,6 @@ on statistics collected when the non-partitioned table is created. In this scena data that doesn't match the filter. To guarantee that the Delta Kernel prunes out unnecessary column values, only use filters on partitioned columns. - `and` filter: | Property | Description | Required | @@ -1217,7 +1224,6 @@ filters on partitioned columns. 
| column | The table column to apply the filter on. | yes | | value | The value to use in the filter. | yes | - The following is a sample spec to read all records from the Delta table `/delta-table/foo`: ```json diff --git a/docs/ingestion/native-batch.md b/docs/ingestion/native-batch.md index fc234cce0a2..398fea9f69a 100644 --- a/docs/ingestion/native-batch.md +++ b/docs/ingestion/native-batch.md @@ -28,12 +28,14 @@ sidebar_label: JSON-based batch ::: Apache Druid supports the following types of JSON-based batch indexing tasks: + - Parallel task indexing (`index_parallel`) that can run multiple indexing tasks concurrently. Parallel task works well for production ingestion tasks. - Simple task indexing (`index`) that run a single indexing task at a time. Simple task indexing is suitable for development and test environments. This topic covers the configuration for `index_parallel` ingestion specs. For related information on batch indexing, see: + - [Batch ingestion method comparison table](./index.md#batch) for a comparison of batch ingestion methods. - [Tutorial: Loading a file](../tutorials/tutorial-batch.md) for a tutorial on JSON-based batch ingestion. - [Input sources](./input-sources.md) for possible input sources. @@ -97,7 +99,6 @@ By default, JSON-based batch ingestion replaces all data in the intervals in you You can also perform concurrent append and replace tasks. For more information, see [Concurrent append and replace](./concurrent-append-replace.md) - #### Fully replacing existing segments using tombstones :::info @@ -124,12 +125,12 @@ You want to re-ingest and overwrite with new data as follows: Unless you set `dropExisting` to true, the result after ingestion with overwrite using the same `MONTH` `segmentGranularity` would be: -* **January**: 1 record -* **February**: 10 records -* **March**: 9 records +- **January**: 1 record +- **February**: 10 records +- **March**: 9 records This may not be what it is expected since the new data has 0 records for January. Set `dropExisting` to true to replace the unneeded January segment with a tombstone. - + ## Parallel indexing example The following example illustrates the configuration for a parallel indexing task. @@ -214,6 +215,7 @@ The following example illustrates the configuration for a parallel indexing task } } ``` + ## Parallel indexing configuration @@ -305,7 +307,7 @@ The segments split hint spec is used only for [`DruidInputSource`](./input-sourc ### `partitionsSpec` -The primary partition for Druid is time. You can define a secondary partitioning method in the partitions spec. Use the `partitionsSpec` type that applies for your [rollup](rollup.md) method. +The primary partition for Druid is time. You can define a secondary partitioning method in the partitions spec. Use the `partitionsSpec` type that applies for your [rollup](rollup.md) method. For perfect rollup, you can use: @@ -366,7 +368,7 @@ In the `partial segment generation` phase, just like the Map phase in MapReduce, the Parallel task splits the input data based on the split hint spec and assigns each split to a worker task. Each worker task (type `partial_index_generate`) reads the assigned split, and partitions rows by the time chunk from `segmentGranularity` (primary partition key) in the `granularitySpec` and then by the hash value of `partitionDimensions` (secondary partition key) in the `partitionsSpec`. 
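For illustration, the secondary hash partitioning described above is configured through a `hashed` `partitionsSpec` in the `tuningConfig`; a minimal sketch (the shard count and dimension names below are placeholders, not values taken from any spec in this patch) looks like:

```json
{
  "type": "hashed",
  "numShards": 4,
  "partitionDimensions": ["countryName", "cityName"]
}
```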
-The partitioned data is stored in local storage of +The partitioned data is stored in local storage of the [middleManager](../design/middlemanager.md) or the [indexer](../design/indexer.md). The `partial segment merge` phase is similar to the Reduce phase in MapReduce. @@ -709,12 +711,14 @@ The returned result contains the worker task spec, a current task status if exis "taskHistory": [] } ``` + `http://{PEON_IP}:{PEON_PORT}/druid/worker/v1/chat/{SUPERVISOR_TASK_ID}/subtaskspec/{SUB_TASK_SPEC_ID}/history` Returns the task attempt history of the worker task spec of the given id, or HTTP 404 Not Found error if the supervisor task is running in the sequential mode. ## Segment pushing modes + While ingesting data using the parallel task indexing, Druid creates segments from the input data and pushes them. For segment pushing, the parallel task index supports the following segment pushing modes based upon your type of [rollup](./rollup.md): @@ -743,10 +747,12 @@ This may help the higher priority tasks to finish earlier than lower priority ta by assigning more task slots to them. ## Splittable input sources + Use the `inputSource` object to define the location where your index can read data. Only the native parallel task and simple task support the input source. For details on available input sources see: -- [S3 input source](./input-sources.md#s3-input-source) (`s3`) reads data from AWS S3 storage. + +- [S3 input source](./input-sources.md#s3-input-source) (`s3`) reads data from Amazon S3 storage. - [Google Cloud Storage input source](./input-sources.md#google-cloud-storage-input-source) (`gs`) reads data from Google Cloud Storage. - [Azure input source](./input-sources.md#azure-input-source) (`azure`) reads data from Azure Blob Storage and Azure Data Lake. - [HDFS input source](./input-sources.md#hdfs-input-source) (`hdfs`) reads data from HDFS storage. 
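As a companion to the splittable input sources listed above, a minimal parallel-task `ioConfig` sketch using the S3 input source might look like the following; the bucket prefix and input format are placeholders chosen for illustration:

```json
{
  "type": "index_parallel",
  "inputSource": {
    "type": "s3",
    "prefixes": ["s3://your-bucket/path/to/data/"]
  },
  "inputFormat": {
    "type": "json"
  }
}
```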
diff --git a/website/.spelling b/website/.spelling index 6bda08d608d..31b151a921d 100644 --- a/website/.spelling +++ b/website/.spelling @@ -216,6 +216,7 @@ ROUTINE_TYPE Rackspace Redis S3 +SAS SDK SIGAR SPNEGO From 35709de54969cf9ba297884323e55273217981bf Mon Sep 17 00:00:00 2001 From: Adithya Chakilam <35785271+adithyachakilam@users.noreply.github.com> Date: Thu, 20 Jun 2024 12:23:59 -0500 Subject: [PATCH 04/72] CgroupCpuSetMonitor: Initialize the cgroup discoverer (#16621) --- .../apache/druid/java/util/metrics/CgroupCpuSetMonitor.java | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/processing/src/main/java/org/apache/druid/java/util/metrics/CgroupCpuSetMonitor.java b/processing/src/main/java/org/apache/druid/java/util/metrics/CgroupCpuSetMonitor.java index 0534e00259f..84de0fd216d 100644 --- a/processing/src/main/java/org/apache/druid/java/util/metrics/CgroupCpuSetMonitor.java +++ b/processing/src/main/java/org/apache/druid/java/util/metrics/CgroupCpuSetMonitor.java @@ -24,6 +24,7 @@ import org.apache.druid.java.util.emitter.service.ServiceEmitter; import org.apache.druid.java.util.emitter.service.ServiceMetricEvent; import org.apache.druid.java.util.metrics.cgroups.CgroupDiscoverer; import org.apache.druid.java.util.metrics.cgroups.CpuSet; +import org.apache.druid.java.util.metrics.cgroups.ProcSelfCgroupDiscoverer; import java.util.Map; @@ -41,7 +42,7 @@ public class CgroupCpuSetMonitor extends FeedDefiningMonitor public CgroupCpuSetMonitor(final Map dimensions, String feed) { - this(null, dimensions, feed); + this(new ProcSelfCgroupDiscoverer(), dimensions, feed); } public CgroupCpuSetMonitor(final Map dimensions) From cd438b1918c1bf925e76ba97b6ce076cde831df4 Mon Sep 17 00:00:00 2001 From: Akshat Jain Date: Fri, 21 Jun 2024 11:36:47 +0530 Subject: [PATCH 05/72] Emit metrics for S3UploadThreadPool (#16616) * Emit metrics for S3UploadThreadPool * Address review comments * Revert unnecessary formatting change * Revert unnecessary formatting change in metrics.md file * Address review comments * Add metric for task duration * Minor fix in metrics.md * Add s3Key and uploadId in the log message * Address review comments * Create new instance of ServiceMetricEvent.Builder for thread safety * Address review comments * Address review comments --- docs/operations/metrics.md | 13 ++++ .../s3/output/RetryableS3OutputStream.java | 22 ++++-- .../storage/s3/output/S3UploadManager.java | 75 ++++++++++++++----- .../s3/S3StorageConnectorProviderTest.java | 4 +- .../output/RetryableS3OutputStreamTest.java | 4 +- .../s3/output/S3StorageConnectorTest.java | 4 +- .../s3/output/S3UploadManagerTest.java | 9 ++- .../java/util/metrics/StubServiceEmitter.java | 4 +- 8 files changed, 104 insertions(+), 31 deletions(-) diff --git a/docs/operations/metrics.md b/docs/operations/metrics.md index bf241ac5708..1d37169684e 100644 --- a/docs/operations/metrics.md +++ b/docs/operations/metrics.md @@ -508,6 +508,19 @@ These metrics are only available if the `OshiSysMonitor` module is included. |`sys/tcpv4/out/rsts`|Total "out reset" packets sent to reset the connection||Generally 0| |`sys/tcpv4/retrans/segs`|Total segments re-transmitted||Varies| + +## S3 multi-part upload + +These metrics are only available if the `druid-s3-extensions` module is included and if certain specific features are being used: MSQ export to S3, durable intermediate storage on S3. 
+ +|Metric|Description|Dimensions|Normal value| +|------|-----------|----------|------------| +|`s3/upload/part/queueSize`|Number of items currently waiting in queue to be uploaded to S3. Each item in the queue corresponds to a single part in a multi-part upload.||Varies| +|`s3/upload/part/queuedTime`|Milliseconds spent by a single item (or part) in queue before it starts getting uploaded to S3.|`uploadId`, `partNumber`|Varies| +|`s3/upload/part/time`|Milliseconds taken to upload a single part of a multi-part upload to S3.|`uploadId`, `partNumber`|Varies| +|`s3/upload/total/time`|Milliseconds taken for uploading all parts of a multi-part upload to S3.|`uploadId`|Varies| +|`s3/upload/total/bytes`|Total bytes uploaded to S3 during a multi-part upload.|`uploadId`|Varies| + ## Cgroup These metrics are available on operating systems with the cgroup kernel feature. All the values are derived by reading from `/sys/fs/cgroup`. diff --git a/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/RetryableS3OutputStream.java b/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/RetryableS3OutputStream.java index d0e5d0ee3ff..aa672444581 100644 --- a/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/RetryableS3OutputStream.java +++ b/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/RetryableS3OutputStream.java @@ -32,6 +32,7 @@ import org.apache.druid.java.util.common.FileUtils; import org.apache.druid.java.util.common.RetryUtils; import org.apache.druid.java.util.common.io.Closer; import org.apache.druid.java.util.common.logger.Logger; +import org.apache.druid.java.util.emitter.service.ServiceMetricEvent; import org.apache.druid.storage.s3.S3Utils; import org.apache.druid.storage.s3.ServerSideEncryptingAmazonS3; @@ -69,6 +70,11 @@ import java.util.concurrent.TimeUnit; */ public class RetryableS3OutputStream extends OutputStream { + // Metric related constants. 
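+  // Note: besides handing chunks to S3UploadManager for upload, this stream emits the
+  // "s3/upload/total/time" and "s3/upload/total/bytes" metrics once all part-upload
+  // futures have completed, using the uploadId as a dimension.
+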
+ private static final String METRIC_PREFIX = "s3/upload/total/"; + private static final String METRIC_TOTAL_UPLOAD_TIME = METRIC_PREFIX + "time"; + private static final String METRIC_TOTAL_UPLOAD_BYTES = METRIC_PREFIX + "bytes"; + private static final Logger LOG = new Logger(RetryableS3OutputStream.class); private final S3OutputConfig config; @@ -208,14 +214,20 @@ public class RetryableS3OutputStream extends OutputStream org.apache.commons.io.FileUtils.forceDelete(chunkStorePath); LOG.info("Deleted chunkStorePath[%s]", chunkStorePath); - // This should be emitted as a metric - long totalChunkSize = (currentChunk.id - 1) * chunkSize + currentChunk.length(); + final long totalBytesUploaded = (currentChunk.id - 1) * chunkSize + currentChunk.length(); + final long totalUploadTimeMillis = pushStopwatch.elapsed(TimeUnit.MILLISECONDS); LOG.info( - "Pushed total [%d] parts containing [%d] bytes in [%d]ms.", + "Pushed total [%d] parts containing [%d] bytes in [%d]ms for s3Key[%s], uploadId[%s].", futures.size(), - totalChunkSize, - pushStopwatch.elapsed(TimeUnit.MILLISECONDS) + totalBytesUploaded, + totalUploadTimeMillis, + s3Key, + uploadId ); + + final ServiceMetricEvent.Builder builder = new ServiceMetricEvent.Builder().setDimension("uploadId", uploadId); + uploadManager.emitMetric(builder.setMetric(METRIC_TOTAL_UPLOAD_TIME, totalUploadTimeMillis)); + uploadManager.emitMetric(builder.setMetric(METRIC_TOTAL_UPLOAD_BYTES, totalBytesUploaded)); }); try (Closer ignored = closer) { diff --git a/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/S3UploadManager.java b/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/S3UploadManager.java index 9caa2bcb2e3..cc9ce4bf15a 100644 --- a/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/S3UploadManager.java +++ b/extensions-core/s3-extensions/src/main/java/org/apache/druid/storage/s3/output/S3UploadManager.java @@ -25,10 +25,13 @@ import com.google.common.annotations.VisibleForTesting; import com.google.inject.Inject; import org.apache.druid.guice.ManageLifecycle; import org.apache.druid.java.util.common.RetryUtils; +import org.apache.druid.java.util.common.Stopwatch; import org.apache.druid.java.util.common.concurrent.Execs; import org.apache.druid.java.util.common.lifecycle.LifecycleStart; import org.apache.druid.java.util.common.lifecycle.LifecycleStop; import org.apache.druid.java.util.common.logger.Logger; +import org.apache.druid.java.util.emitter.service.ServiceEmitter; +import org.apache.druid.java.util.emitter.service.ServiceMetricEvent; import org.apache.druid.storage.s3.S3Utils; import org.apache.druid.storage.s3.ServerSideEncryptingAmazonS3; import org.apache.druid.utils.RuntimeInfo; @@ -36,6 +39,7 @@ import org.apache.druid.utils.RuntimeInfo; import java.io.File; import java.util.concurrent.ExecutorService; import java.util.concurrent.Future; +import java.util.concurrent.atomic.AtomicInteger; /** * This class manages uploading files to S3 in chunks, while ensuring that the @@ -44,18 +48,34 @@ import java.util.concurrent.Future; @ManageLifecycle public class S3UploadManager { + // Metric related constants. 
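+  // Note: each part handed to the upload executor is tracked so the manager can emit the
+  // "s3/upload/part/queueSize", "s3/upload/part/queuedTime", and "s3/upload/part/time"
+  // metrics through the injected ServiceEmitter.
+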
+ private static final String METRIC_PREFIX = "s3/upload/part/"; + private static final String METRIC_PART_QUEUED_TIME = METRIC_PREFIX + "queuedTime"; + private static final String METRIC_QUEUE_SIZE = METRIC_PREFIX + "queueSize"; + private static final String METRIC_PART_UPLOAD_TIME = METRIC_PREFIX + "time"; + private final ExecutorService uploadExecutor; + private final ServiceEmitter emitter; private static final Logger log = new Logger(S3UploadManager.class); + // For metrics regarding uploadExecutor. + private final AtomicInteger executorQueueSize = new AtomicInteger(0); + @Inject - public S3UploadManager(S3OutputConfig s3OutputConfig, S3ExportConfig s3ExportConfig, RuntimeInfo runtimeInfo) + public S3UploadManager( + S3OutputConfig s3OutputConfig, + S3ExportConfig s3ExportConfig, + RuntimeInfo runtimeInfo, + ServiceEmitter emitter + ) { int poolSize = Math.max(4, runtimeInfo.getAvailableProcessors()); int maxNumChunksOnDisk = computeMaxNumChunksOnDisk(s3OutputConfig, s3ExportConfig); this.uploadExecutor = createExecutorService(poolSize, maxNumChunksOnDisk); log.info("Initialized executor service for S3 multipart upload with pool size [%d] and work queue capacity [%d]", poolSize, maxNumChunksOnDisk); + this.emitter = emitter; } /** @@ -87,25 +107,36 @@ public class S3UploadManager S3OutputConfig config ) { - return uploadExecutor.submit(() -> RetryUtils.retry( - () -> { - log.debug("Uploading chunk[%d] for uploadId[%s].", chunkNumber, uploadId); - UploadPartResult uploadPartResult = uploadPartIfPossible( - s3Client, - uploadId, - config.getBucket(), - key, - chunkNumber, - chunkFile - ); - if (!chunkFile.delete()) { - log.warn("Failed to delete chunk [%s]", chunkFile.getAbsolutePath()); - } - return uploadPartResult; - }, - S3Utils.S3RETRY, - config.getMaxRetry() - )); + final Stopwatch stopwatch = Stopwatch.createStarted(); + executorQueueSize.incrementAndGet(); + return uploadExecutor.submit(() -> { + final ServiceMetricEvent.Builder metricBuilder = new ServiceMetricEvent.Builder(); + emitMetric(metricBuilder.setMetric(METRIC_QUEUE_SIZE, executorQueueSize.decrementAndGet())); + metricBuilder.setDimension("uploadId", uploadId).setDimension("partNumber", chunkNumber); + emitMetric(metricBuilder.setMetric(METRIC_PART_QUEUED_TIME, stopwatch.millisElapsed())); + stopwatch.restart(); + + return RetryUtils.retry( + () -> { + log.debug("Uploading chunk[%d] for uploadId[%s].", chunkNumber, uploadId); + UploadPartResult uploadPartResult = uploadPartIfPossible( + s3Client, + uploadId, + config.getBucket(), + key, + chunkNumber, + chunkFile + ); + if (!chunkFile.delete()) { + log.warn("Failed to delete chunk [%s]", chunkFile.getAbsolutePath()); + } + emitMetric(metricBuilder.setMetric(METRIC_PART_UPLOAD_TIME, stopwatch.millisElapsed())); + return uploadPartResult; + }, + S3Utils.S3RETRY, + config.getMaxRetry() + ); + }); } @VisibleForTesting @@ -149,4 +180,8 @@ public class S3UploadManager uploadExecutor.shutdown(); } + protected void emitMetric(ServiceMetricEvent.Builder builder) + { + emitter.emit(builder); + } } diff --git a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/S3StorageConnectorProviderTest.java b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/S3StorageConnectorProviderTest.java index 676352daf4f..a880d6f2efa 100644 --- a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/S3StorageConnectorProviderTest.java +++ 
b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/S3StorageConnectorProviderTest.java @@ -32,6 +32,7 @@ import org.apache.druid.guice.JsonConfigProvider; import org.apache.druid.guice.LazySingleton; import org.apache.druid.guice.StartupInjectorBuilder; import org.apache.druid.java.util.common.HumanReadableBytes; +import org.apache.druid.java.util.metrics.StubServiceEmitter; import org.apache.druid.query.DruidProcessingConfigTest; import org.apache.druid.storage.StorageConnector; import org.apache.druid.storage.StorageConnectorModule; @@ -158,7 +159,8 @@ public class S3StorageConnectorProviderTest new S3UploadManager( new S3OutputConfig("bucket", "prefix", EasyMock.mock(File.class), new HumanReadableBytes("5MiB"), 1), new S3ExportConfig("tempDir", new HumanReadableBytes("5MiB"), 1, null), - new DruidProcessingConfigTest.MockRuntimeInfo(10, 0, 0)) + new DruidProcessingConfigTest.MockRuntimeInfo(10, 0, 0), + new StubServiceEmitter()) ) ); diff --git a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/RetryableS3OutputStreamTest.java b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/RetryableS3OutputStreamTest.java index 8e7a81eb48d..8d15624c0d0 100644 --- a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/RetryableS3OutputStreamTest.java +++ b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/RetryableS3OutputStreamTest.java @@ -33,6 +33,7 @@ import com.amazonaws.services.s3.model.UploadPartResult; import org.apache.druid.java.util.common.HumanReadableBytes; import org.apache.druid.java.util.common.IOE; import org.apache.druid.java.util.common.StringUtils; +import org.apache.druid.java.util.metrics.StubServiceEmitter; import org.apache.druid.query.DruidProcessingConfigTest; import org.apache.druid.storage.s3.NoopServerSideEncryption; import org.apache.druid.storage.s3.ServerSideEncryptingAmazonS3; @@ -105,7 +106,8 @@ public class RetryableS3OutputStreamTest s3UploadManager = new S3UploadManager( new S3OutputConfig("bucket", "prefix", EasyMock.mock(File.class), new HumanReadableBytes("5MiB"), 1), new S3ExportConfig("tempDir", new HumanReadableBytes("5MiB"), 1, null), - new DruidProcessingConfigTest.MockRuntimeInfo(10, 0, 0)); + new DruidProcessingConfigTest.MockRuntimeInfo(10, 0, 0), + new StubServiceEmitter()); } @Test diff --git a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3StorageConnectorTest.java b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3StorageConnectorTest.java index 67dcb3b6db6..68eaca1c42a 100644 --- a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3StorageConnectorTest.java +++ b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3StorageConnectorTest.java @@ -32,6 +32,7 @@ import com.amazonaws.services.s3.model.S3ObjectSummary; import com.google.common.collect.ImmutableList; import com.google.common.collect.Lists; import org.apache.druid.java.util.common.HumanReadableBytes; +import org.apache.druid.java.util.metrics.StubServiceEmitter; import org.apache.druid.query.DruidProcessingConfigTest; import org.apache.druid.storage.StorageConnector; import org.apache.druid.storage.s3.NoopServerSideEncryption; @@ -90,7 +91,8 @@ public class S3StorageConnectorTest storageConnector = new S3StorageConnector(s3OutputConfig, service, new S3UploadManager( s3OutputConfig, new S3ExportConfig("tempDir", new 
HumanReadableBytes("5MiB"), 1, null), - new DruidProcessingConfigTest.MockRuntimeInfo(10, 0, 0))); + new DruidProcessingConfigTest.MockRuntimeInfo(10, 0, 0), + new StubServiceEmitter())); } catch (IOException e) { throw new RuntimeException(e); diff --git a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3UploadManagerTest.java b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3UploadManagerTest.java index b79c392844d..75305a3c95a 100644 --- a/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3UploadManagerTest.java +++ b/extensions-core/s3-extensions/src/test/java/org/apache/druid/storage/s3/output/S3UploadManagerTest.java @@ -22,6 +22,7 @@ package org.apache.druid.storage.s3.output; import com.amazonaws.services.s3.model.UploadPartRequest; import com.amazonaws.services.s3.model.UploadPartResult; import org.apache.druid.java.util.common.HumanReadableBytes; +import org.apache.druid.java.util.metrics.StubServiceEmitter; import org.apache.druid.query.DruidProcessingConfigTest; import org.apache.druid.storage.s3.ServerSideEncryptingAmazonS3; import org.apache.druid.utils.RuntimeInfo; @@ -43,14 +44,16 @@ public class S3UploadManagerTest private S3UploadManager s3UploadManager; private S3OutputConfig s3OutputConfig; private S3ExportConfig s3ExportConfig; + private StubServiceEmitter serviceEmitter; @Before public void setUp() { s3OutputConfig = new S3OutputConfig("bucket", "prefix", EasyMock.mock(File.class), new HumanReadableBytes("100MiB"), 1); s3ExportConfig = new S3ExportConfig("tempDir", new HumanReadableBytes("200MiB"), 1, null); + serviceEmitter = new StubServiceEmitter(); final RuntimeInfo runtimeInfo = new DruidProcessingConfigTest.MockRuntimeInfo(8, 0, 0); - s3UploadManager = new S3UploadManager(s3OutputConfig, s3ExportConfig, runtimeInfo); + s3UploadManager = new S3UploadManager(s3OutputConfig, s3ExportConfig, runtimeInfo, serviceEmitter); } @Test @@ -75,6 +78,10 @@ public class S3UploadManagerTest UploadPartResult futureResult = result.get(); Assert.assertEquals(chunkId, futureResult.getPartNumber()); Assert.assertEquals("etag", futureResult.getETag()); + + serviceEmitter.verifyEmitted("s3/upload/part/queuedTime", 1); + serviceEmitter.verifyEmitted("s3/upload/part/queueSize", 1); + serviceEmitter.verifyEmitted("s3/upload/part/time", 1); } @Test diff --git a/processing/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java b/processing/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java index 2ddba7c6cd8..e4a8b9403dd 100644 --- a/processing/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java +++ b/processing/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java @@ -26,9 +26,9 @@ import org.apache.druid.java.util.emitter.service.ServiceMetricEvent; import java.util.ArrayList; import java.util.Collections; -import java.util.HashMap; import java.util.List; import java.util.Map; +import java.util.concurrent.ConcurrentHashMap; /** * Test implementation of {@link ServiceEmitter} that collects emitted metrics @@ -38,7 +38,7 @@ public class StubServiceEmitter extends ServiceEmitter implements MetricsVerifie { private final List events = new ArrayList<>(); private final List alertEvents = new ArrayList<>(); - private final Map> metricEvents = new HashMap<>(); + private final ConcurrentHashMap> metricEvents = new ConcurrentHashMap<>(); public StubServiceEmitter() { From 4e0ea7823b128cc214df8dc774d370b306b91461 Mon Sep 17 
00:00:00 2001 From: Suneet Saldanha Date: Fri, 21 Jun 2024 06:01:59 -0700 Subject: [PATCH 06/72] Update docs for K8s TaskRunner Dynamic Config (#16600) * Update docs for K8s TaskRunner Dynamic Config * touchups * code review * npe * oopsies --- .../extensions-contrib/k8s-jobs.md | 413 ++++++++++++++++-- .../execution/PodTemplateSelectStrategy.java | 6 +- ...electorBasedPodTemplateSelectStrategy.java | 23 +- .../taskadapter/PodTemplateTaskAdapter.java | 5 - ...KubernetesTaskRunnerDynamicConfigTest.java | 3 +- ...torBasedPodTemplateSelectStrategyTest.java | 20 +- .../PodTemplateTaskAdapterTest.java | 2 +- 7 files changed, 386 insertions(+), 86 deletions(-) diff --git a/docs/development/extensions-contrib/k8s-jobs.md b/docs/development/extensions-contrib/k8s-jobs.md index 1d75e2b7efe..082b8735349 100644 --- a/docs/development/extensions-contrib/k8s-jobs.md +++ b/docs/development/extensions-contrib/k8s-jobs.md @@ -40,7 +40,280 @@ The extension uses `druid.indexer.runner.capacity` to limit the number of k8s jo Other configurations required are: `druid.indexer.runner.type: k8s` and `druid.indexer.task.encapsulatedTask: true` -## Pod Adapters +### Dynamic config + +Druid operators can dynamically tune certain features within this extension. You don't need to restart the Overlord +service for these changes to take effect. + +Druid can dynamically tune [pod template selection](#pod-template-selection), which allows you to configure the pod +template based on the task to be run. To enable dynamic pod template selection, first configure the +[custom template pod adapter](#custom-template-pod-adapter). + +Use the following APIs to view and update the dynamic configuration for the Kubernetes task runner. + +To use these APIs, ensure you have read and write permissions for the CONFIG resource type with the resource name +"CONFIG". For more information on permissions, see +[User authentication and authorization](../../operations/security-user-auth.md#config). + +#### Get dynamic configuration + +Retrieves the current dynamic execution config for the Kubernetes task runner. +Returns a JSON object with the dynamic configuration properties. + +##### URL + +`GET` `/druid/indexer/v1/k8s/taskRunner/executionConfig` + +##### Responses + + + + + + +*Successfully retrieved dynamic configuration* + + + + +--- + +##### Sample request + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/k8s/taskRunner/executionConfig" +``` + + + + +```HTTP +GET /druid/indexer/v1/k8s/taskRunner/executionConfig HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +##### Sample response + +
+View the response + +```json +{ + "type": "default", + "podTemplateSelectStrategy": + { + "type": "selectorBased", + "selectors": [ + { + "selectionKey": "podSpec1", + "context.tags": { + "userProvidedTag": ["tag1", "tag2"] + }, + "dataSource": ["wikipedia"] + }, + { + "selectionKey": "podSpec2", + "type": ["index_kafka"] + } + ] + } +} +``` +
+ +#### Update dynamic configuration + +Updates the dynamic configuration for the Kubernetes Task Runner + +##### URL + +`POST` `/druid/indexer/v1/k8s/taskRunner/executionConfig` + +##### Header parameters + +The endpoint supports the following optional header parameters to populate the `author` and `comment` fields in the configuration history. + +* `X-Druid-Author` + * Type: String + * Author of the configuration change. +* `X-Druid-Comment` + * Type: String + * Description for the update. + +##### Responses + + + + + + +*Successfully updated dynamic configuration* + + + + +--- + +##### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/k8s/taskRunner/executionConfig" \ +--header 'Content-Type: application/json' \ +--data '{ + "type": "default", + "podTemplateSelectStrategy": + { + "type": "selectorBased", + "selectors": [ + { + "selectionKey": "podSpec1", + "context.tags": + { + "userProvidedTag": ["tag1", "tag2"] + }, + "dataSource": ["wikipedia"] + }, + { + "selectionKey": "podSpec2", + "type": ["index_kafka"] + } + ] + } +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/k8s/taskRunner/executionConfig HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json + +{ + "type": "default", + "podTemplateSelectStrategy": + { + "type": "selectorBased", + "selectors": [ + { + "selectionKey": "podSpec1", + "context.tags": + { + "userProvidedTag": ["tag1", "tag2"] + }, + "dataSource": ["wikipedia"] + }, + { + "selectionKey": "podSpec2", + "type": ["index_kafka"] + } + ] + } +} +``` + + + + +##### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +#### Get dynamic configuration history + +Retrieves the history of changes to Kubernetes task runner's dynamic execution config over an interval of time. Returns +an empty array if there are no history records available. + +##### URL + +`GET` `/druid/indexer/v1/k8s/taskRunner/executionConfig/history` + +##### Query parameters + +The endpoint supports the following optional query parameters to filter results. + +* `interval` + * Type: String + * Limit the results to the specified time interval in ISO 8601 format delimited with `/`. For example, `2023-07-13/2023-07-19`. The default interval is one week. You can change this period by setting `druid.audit.manager.auditHistoryMillis` in the `runtime.properties` file for the Coordinator. + +* `count` + * Type: Integer + * Limit the number of results to the last `n` entries. + +##### Responses + + + + + + +*Successfully retrieved dynamic configuration* + + + + +--- + +##### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/k8s/taskRunner/executionConfig/history" +``` + + + + + +```HTTP +GET /druid/indexer/v1/k8s/taskRunner/executionConfig/history HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +##### Sample response + +
+View the response + +```json +[ + { + "key": "k8s.taskrunner.config", + "type": "k8s.taskrunner.config", + "auditInfo": { + "author": "", + "comment": "", + "ip": "127.0.0.1" + }, + "payload": "{\"type\": \"default\",\"podTemplateSelectStrategy\":{\"type\": \"taskType\"}", + "auditTime": "2024-06-13T20:59:51.622Z" + } +] +``` +
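The two query parameters documented above can be combined. For example, a request that limits the history to a specific interval and to the last 10 entries might look like the following (the host and interval values are placeholders):

```shell
curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/k8s/taskRunner/executionConfig/history?interval=2024-06-01/2024-06-20&count=10"
```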
+ +## Pod adapters The logic defining how the pod template is built for your Kubernetes Job depends on which pod adapter you have specified. ### Overlord Single Container Pod Adapter/Overlord Multi Container Pod Adapter @@ -65,7 +338,7 @@ and in your sidecar specs: That will not work, because we cannot decipher what your command is, the extension needs to know it explicitly. **Even for sidecars like Istio which are dynamically created by the service mesh, this needs to happen.* -Instead do the following: +Instead, do the following: You can keep your Dockerfile the same but you must have a sidecar spec like so: ``` container: name: foo @@ -90,13 +363,10 @@ The custom template pod adapter allows you to specify a pod template file per ta The base pod template must be specified as the runtime property `druid.indexer.runner.k8s.podTemplate.base: /path/to/basePodSpec.yaml` -Task specific pod templates can be specified as the runtime property `druid.indexer.runner.k8s.podTemplate.{taskType}: /path/to/taskSpecificPodSpec.yaml` where {taskType} is the name of the task type i.e `index_parallel`. +
+Example Pod Template that uses the regular druid docker image -If you are trying to use the default image's environment variable parsing feature to set runtime properties, you need to add a extra escape underscore when specifying pod templates. -e.g. set the environment variable `druid_indexer_runner_k8s_podTemplate_index__parallel` when setting `druid.indxer.runner.k8s.podTemplate.index_parallel` - -The following is an example Pod Template that uses the regular druid docker image. -``` +```yaml apiVersion: "v1" kind: "PodTemplate" template: @@ -164,6 +434,7 @@ template: - emptyDir: {} name: deepstorage-volume ``` +
The below runtime properties need to be passed to the Job's peon process. @@ -177,6 +448,10 @@ druid.indexer.task.encapsulatedTask=true ``` Any runtime property or JVM config used by the peon process can also be passed. E.G. below is a example of a ConfigMap that can be used to generate the `nodetype-config-volume` mount in the above template. + +
+Example ConfigMap + ``` kind: ConfigMap metadata: @@ -217,59 +492,112 @@ data: druid.peon.mode=remote druid.indexer.task.encapsulatedTask=true ``` -#### Dynamic Pod Template Selection Config -The Dynamic Pod Template Selection feature enhances the K8s extension by enabling more flexible and dynamic selection of pod templates based on task properties. This process is governed by the `PodTemplateSelectStrategy`. Below are the two strategies implemented: +
-|Property|Description|Default| -|--------|-----------|-------| -|`TaskTypePodTemplateSelectStrategy`| This strategy selects pod templates based on task type for execution purposes, implementing the behavior that maps templates to specific task types. | true | -|`SelectorBasedPodTemplateSelectStrategy`| This strategy evaluates a series of selectors, known as `selectors`, which are aligned with potential task properties. | false | +#### Pod template selection + +The pod template adapter can select which pod template should be used for a task using the [task runner execution config](#dynamic-config) -`SelectorBasedPodTemplateSelectStrategy`, the strategy implementing this new feature, is based on conditional `selectors` that match against top-level keys from the task payload. Currently, it supports matching based on task context tags, task type, and dataSource. These selectors are ordered in the dynamic configuration, with the first selector given the highest priority during the evaluation process. This means that the selection process uses these ordered conditions to determine a task’s Pod template. The first matching condition immediately determines the Pod template, thereby prioritizing certain configurations over others. If no selector matches, it will fall back to an optional `defaultKey` if configured; if there is still no match, it will use the `base` template. +##### Select based on task type -Example Configuration: +The `TaskTypePodTemplateSelectStrategy` strategy selects pod templates based on task type for execution purposes, +implementing the behavior that maps templates to specific task types. This is the default pod template selection +strategy. To explicitly select this strategy, set the `podTemplateSelectStrategy` in the dynamic execution config to -We define two template keys in the configuration—`low-throughput` and `medium-throughput`—each associated with specific task conditions and arranged in a priority order. - -- Low Throughput Template: This is the first template evaluated and has the highest priority. Tasks that have a context tag `billingCategory=streaming_ingestion` and a datasource of `wikipedia` will be classified under the `low-throughput` template. This classification directs such tasks to utilize a predefined pod template optimized for low throughput requirements. - -- Medium Throughput Template: If a task does not meet the low-throughput criteria, the system will then evaluate it against the next selector in order. In this example, if the task type is index_kafka, it will fall into the `medium-throughput` template. +```json +{ "type": "default" } ``` + +Task specific pod templates can be specified as the runtime property +`druid.indexer.runner.k8s.podTemplate.{taskType}: /path/to/taskSpecificPodSpec.yaml` where {taskType} is the name of the +task type. For example, `index_parallel`. + +If you are trying to use the default image's environment variable parsing feature to set runtime properties, you need to add a extra escape underscore when specifying pod templates. 
+For example, set the environment variable `druid_indexer_runner_k8s_podTemplate_index__kafka` when you set the runtime property `druid.indexer.runner.k8s.podTemplate.index_kafka` + + +The following example shows a configuration for task-based pod template selection: + +```properties +druid.indexer.runner.k8s.podTemplate.base=/path/to/basePodSpec.yaml +druid.indexer.runner.k8s.podTemplate.index_kafka=/path/to/kafkaPodSpec.yaml +``` + +##### Select based on one or more conditions + +The `SelectorBasedPodTemplateSelectStrategy` strategy evaluates a series of criteria within `selectors` to determine +which pod template to use to run the task. Pod templates are configured in the runtime properties like +`druid.indexer.runner.k8s.podTemplate.=...`. + +```json +{ + "type": "selectorBased", + "selectors": [ + { + "selectionKey": "podSpec1", + "context.tags": + { + "userProvidedTag": ["tag1", "tag2"] + }, + "dataSource": ["wikipedia"] + }, + { + "selectionKey": "podSpec2", + "type": ["index_kafka"] + } + ] +} +``` + +Selectors are processed in order. Druid selects the template based on the first matching selector. If a task does not +match any selector in the list, it will use the `base` pod template. + +For a task to match a selector, all the conditions within the selector must match. A selector can match on +- `type`: Type of the task +- `dataSource`: Destination datasource of the task. +- `context.tags`: Tags passed in the task's context. + +##### Example + +Set the following runtime properties to define the pod specs that can be used by Druid. + +```properties +druid.indexer.runner.k8s.podTemplate.base=/path/to/basePodSpec.yaml +druid.indexer.runner.k8s.podTemplate.podSpec1=/path/to/podSpecWithHighMemRequests.yaml +druid.indexer.runner.k8s.podTemplate.podSpec2=/path/to/podSpecWithLowCpuRequests.yaml +``` + +Set the dynamic execution config to define the pod template selection strategy. + +```json { "type": "default", - "podTemplateSelectStrategy": - { + "podTemplateSelectStrategy": { "type": "selectorBased", "selectors": [ { - "selectionKey": "low-throughput", - "context.tags": - { - "billingCategory": ["streaming_ingestion"] - }, + "selectionKey": "podSpec1", + "context.tags": { "userProvidedTag": ["tag1", "tag2"] }, "dataSource": ["wikipedia"] }, { - "selectionKey": "medium-throughput", + "selectionKey": "podSpec2", "type": ["index_kafka"] } - ], - "defaultKey"" "base" + ] } } ``` -Task specific pod templates can be specified as the runtime property `druid.indexer.runner.k8s.podTemplate.{template}: /path/to/taskSpecificPodSpec.yaml` where {template} is the matched `selectionKey` of the `podTemplateSelectStrategy` i.e low-throughput. -Similar to Overlord dynamic configuration, the following API endpoints are defined to retrieve and manage dynamic configurations of Pod Template Selection config: +Druid selects the pod templates as follows: +1. Use `podSpecWithHighMemRequests.yaml` when both of the following conditions are met: + 1. The task context contains a tag with the key `userProvidedTag` that has the value `tag1` or `tag2`. + 2. The task targets the `wikipedia` datasource. +2. Use `podSpecWithLowCpuRequests.yaml` when the task type is `index_kafka`. +3. Use the `basePodSpec.yaml` for all other tasks. 
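For reference, the `context.tags` condition in the first selector matches tags supplied in the task's own context; a sketch of how such a tag might appear in a task payload (the shape shown here is illustrative) is:

```json
{
  "context": {
    "tags": {
      "userProvidedTag": "tag1"
    }
  }
}
```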
-- Get dynamic configuration: -`POST` `/druid/indexer/v1/k8s/taskRunner/executionConfig` - -- Update dynamic configuration: -`GET` `/druid/indexer/v1/k8s/taskRunner/executionConfig` - -- Get dynamic configuration history: -`GET` `/druid/indexer/v1/k8s/taskRunner/executionConfig/history` +In this example, if there is an `index_kafka` task for the `wikipedia` datasource with the tag `userProvidedTag: tag1`, +Druid selects the pod template `podSpecWithHighMemRequests.yaml`. ### Properties |Property| Possible Values | Description |Default|required| @@ -302,7 +630,8 @@ Similar to Overlord dynamic configuration, the following API endpoints are defin - All Druid Pods belonging to one Druid cluster must be inside the same Kubernetes namespace. - You must have a role binding for the overlord's service account that provides the needed permissions for interacting with Kubernetes. An example spec could be: -``` + +```yaml kind: Role apiVersion: rbac.authorization.k8s.io/v1 metadata: diff --git a/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/PodTemplateSelectStrategy.java b/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/PodTemplateSelectStrategy.java index 1b8d57419d2..ae7869707fc 100644 --- a/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/PodTemplateSelectStrategy.java +++ b/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/PodTemplateSelectStrategy.java @@ -24,6 +24,7 @@ import com.fasterxml.jackson.annotation.JsonTypeInfo; import io.fabric8.kubernetes.api.model.PodTemplate; import org.apache.druid.indexing.common.task.Task; +import javax.validation.constraints.NotNull; import java.util.Map; /** @@ -41,8 +42,7 @@ public interface PodTemplateSelectStrategy * allows for customized resource allocation and management tailored to the task's specific requirements. * * @param task The task for which the Pod template is determined. - * @return The selected Pod template. If no matching template is found, - * the method falls back to a base template. + * @return The pod template that should be used to run the task. 
*/ - PodTemplate getPodTemplateForTask(Task task, Map templates); + @NotNull PodTemplate getPodTemplateForTask(Task task, Map templates); } diff --git a/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategy.java b/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategy.java index 938ed04e6a6..4c2d01b5218 100644 --- a/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategy.java +++ b/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategy.java @@ -25,7 +25,6 @@ import com.google.common.base.Preconditions; import io.fabric8.kubernetes.api.model.PodTemplate; import org.apache.druid.indexing.common.task.Task; -import javax.annotation.Nullable; import java.util.List; import java.util.Map; import java.util.Objects; @@ -36,19 +35,15 @@ import java.util.Objects; */ public class SelectorBasedPodTemplateSelectStrategy implements PodTemplateSelectStrategy { - @Nullable - private String defaultKey; - private List selectors; + private final List selectors; @JsonCreator public SelectorBasedPodTemplateSelectStrategy( - @JsonProperty("selectors") List selectors, - @JsonProperty("defaultKey") @Nullable String defaultKey + @JsonProperty("selectors") List selectors ) { Preconditions.checkNotNull(selectors, "selectors"); this.selectors = selectors; - this.defaultKey = defaultKey; } /** @@ -64,7 +59,7 @@ public class SelectorBasedPodTemplateSelectStrategy implements PodTemplateSelect .filter(selector -> selector.evaluate(task)) .findFirst() .map(Selector::getSelectionKey) - .orElse(defaultKey); + .orElse("base"); return templates.getOrDefault(templateKey, templates.get("base")); } @@ -75,13 +70,6 @@ public class SelectorBasedPodTemplateSelectStrategy implements PodTemplateSelect return selectors; } - @Nullable - @JsonProperty - public String getDefaultKey() - { - return defaultKey; - } - @Override public boolean equals(Object o) { @@ -92,13 +80,13 @@ public class SelectorBasedPodTemplateSelectStrategy implements PodTemplateSelect return false; } SelectorBasedPodTemplateSelectStrategy that = (SelectorBasedPodTemplateSelectStrategy) o; - return Objects.equals(defaultKey, that.defaultKey) && Objects.equals(selectors, that.selectors); + return Objects.equals(selectors, that.selectors); } @Override public int hashCode() { - return Objects.hash(defaultKey, selectors); + return Objects.hash(selectors); } @Override @@ -106,7 +94,6 @@ public class SelectorBasedPodTemplateSelectStrategy implements PodTemplateSelect { return "SelectorBasedPodTemplateSelectStrategy{" + "selectors=" + selectors + - ", defaultKey=" + defaultKey + '}'; } } diff --git a/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapter.java b/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapter.java index 8e3788e31e1..19cc788b3ee 100644 --- a/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapter.java +++ b/extensions-contrib/kubernetes-overlord-extensions/src/main/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapter.java @@ -39,7 +39,6 @@ import 
org.apache.druid.guice.IndexingServiceModuleHelper; import org.apache.druid.indexing.common.config.TaskConfig; import org.apache.druid.indexing.common.task.Task; import org.apache.druid.java.util.common.IAE; -import org.apache.druid.java.util.common.ISE; import org.apache.druid.java.util.common.StringUtils; import org.apache.druid.java.util.common.logger.Logger; import org.apache.druid.k8s.overlord.KubernetesTaskRunnerConfig; @@ -141,10 +140,6 @@ public class PodTemplateTaskAdapter implements TaskAdapter PodTemplate podTemplate = podTemplateSelectStrategy.getPodTemplateForTask(task, templates); - if (podTemplate == null) { - throw new ISE("Pod template spec not found for task type [%s]", task.getType()); - } - return new JobBuilder() .withNewMetadata() .withName(new K8sTaskId(task).getK8sJobName()) diff --git a/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/KubernetesTaskRunnerDynamicConfigTest.java b/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/KubernetesTaskRunnerDynamicConfigTest.java index 6236794d366..77a819dde9c 100644 --- a/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/KubernetesTaskRunnerDynamicConfigTest.java +++ b/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/KubernetesTaskRunnerDynamicConfigTest.java @@ -64,8 +64,7 @@ public class KubernetesTaskRunnerDynamicConfigTest + " \"selectionKey\": \"medium-throughput\",\n" + " \"type\": [\"index_kafka\"]\n" + " }\n" - + " ],\n" - + " \"defaultKey\": \"base\"\n" + + " ]\n" + " }\n" + "}"; diff --git a/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategyTest.java b/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategyTest.java index 9aa1376a515..a82bb076855 100644 --- a/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategyTest.java +++ b/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/execution/SelectorBasedPodTemplateSelectStrategyTest.java @@ -88,14 +88,14 @@ public class SelectorBasedPodTemplateSelectStrategyTest @Test(expected = NullPointerException.class) public void shouldThrowNullPointerExceptionWhenSelectorsAreNull() { - new SelectorBasedPodTemplateSelectStrategy(null, null); + new SelectorBasedPodTemplateSelectStrategy(null); } @Test public void testGetPodTemplate_ForTask_emptySelectorsFallbackToBaseTemplate() { List emptySelectors = Collections.emptyList(); - SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy(emptySelectors, null); + SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy(emptySelectors); Task task = NoopTask.create(); Assert.assertEquals("base", strategy.getPodTemplateForTask(task, templates).getMetadata().getName()); } @@ -105,21 +105,11 @@ public class SelectorBasedPodTemplateSelectStrategyTest { Selector noMatchSelector = new MockSelector(false, "mock"); List selectors = Collections.singletonList(noMatchSelector); - SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy(selectors, null); + SelectorBasedPodTemplateSelectStrategy strategy = new 
SelectorBasedPodTemplateSelectStrategy(selectors); Task task = NoopTask.create(); Assert.assertEquals("base", strategy.getPodTemplateForTask(task, templates).getMetadata().getName()); } - @Test - public void testGetPodTemplate_ForTask_noMatchSelectorsFallbackToDefaultKeyTemplate() - { - Selector noMatchSelector = new MockSelector(false, "mock"); - List selectors = Collections.singletonList(noMatchSelector); - SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy(selectors, "match"); - Task task = NoopTask.create(); - Assert.assertEquals("match", strategy.getPodTemplateForTask(task, templates).getMetadata().getName()); - } - @Test public void testGetPodTemplate_ForTask_withMatchSelectors() { @@ -132,7 +122,7 @@ public class SelectorBasedPodTemplateSelectStrategyTest noMatchSelector, matchSelector ); - SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy(selectors, null); + SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy(selectors); Task task = NoopTask.create(); Assert.assertEquals("match", strategy.getPodTemplateForTask(task, templates).getMetadata().getName()); } @@ -152,7 +142,7 @@ public class SelectorBasedPodTemplateSelectStrategyTest ); SelectorBasedPodTemplateSelectStrategy strategy = new SelectorBasedPodTemplateSelectStrategy( - Collections.singletonList(selector), "default"); + Collections.singletonList(selector)); SelectorBasedPodTemplateSelectStrategy strategy2 = objectMapper.readValue( objectMapper.writeValueAsBytes(strategy), diff --git a/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapterTest.java b/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapterTest.java index 36fc77631a1..4aad419007e 100644 --- a/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapterTest.java +++ b/extensions-contrib/kubernetes-overlord-extensions/src/test/java/org/apache/druid/k8s/overlord/taskadapter/PodTemplateTaskAdapterTest.java @@ -620,7 +620,7 @@ public class PodTemplateTaskAdapterTest dynamicConfigRef = () -> new DefaultKubernetesTaskRunnerDynamicConfig(new SelectorBasedPodTemplateSelectStrategy( Collections.singletonList( new Selector("lowThrougput", null, null, Sets.newSet(dataSource) - )), null)); + )))); PodTemplateTaskAdapter adapter = new PodTemplateTaskAdapter( taskRunnerConfig, From 4eced9b3c99ea818ecef15631662de6f274e70cc Mon Sep 17 00:00:00 2001 From: Rishabh Singh <6513075+findingrish@users.noreply.github.com> Date: Sat, 22 Jun 2024 04:10:12 +0530 Subject: [PATCH 07/72] Fix CentralizedDatasourceSchema group IT failure (#16636) * Fix build * Update datasource name in ITSystemTableBatchIndexTaskTest --- .../druid/tests/indexer/ITSystemTableBatchIndexTaskTest.java | 2 +- .../resources/indexer/sys_segment_batch_index_queries.json | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/integration-tests/src/test/java/org/apache/druid/tests/indexer/ITSystemTableBatchIndexTaskTest.java b/integration-tests/src/test/java/org/apache/druid/tests/indexer/ITSystemTableBatchIndexTaskTest.java index f15081509a0..f98626ad9b5 100644 --- a/integration-tests/src/test/java/org/apache/druid/tests/indexer/ITSystemTableBatchIndexTaskTest.java +++ b/integration-tests/src/test/java/org/apache/druid/tests/indexer/ITSystemTableBatchIndexTaskTest.java 
@@ -37,7 +37,7 @@ public class ITSystemTableBatchIndexTaskTest extends AbstractITBatchIndexTest private static final Logger LOG = new Logger(ITSystemTableBatchIndexTaskTest.class); private static final String INDEX_TASK = "/indexer/wikipedia_index_task.json"; private static final String SYSTEM_QUERIES_RESOURCE = "/indexer/sys_segment_batch_index_queries.json"; - private static final String INDEX_DATASOURCE = "wikipedia_index_test"; + private static final String INDEX_DATASOURCE = "sys_segment_wikipedia_index_test"; @Test public void testIndexData() throws Exception diff --git a/integration-tests/src/test/resources/indexer/sys_segment_batch_index_queries.json b/integration-tests/src/test/resources/indexer/sys_segment_batch_index_queries.json index 931ad895778..b0746e0cab4 100644 --- a/integration-tests/src/test/resources/indexer/sys_segment_batch_index_queries.json +++ b/integration-tests/src/test/resources/indexer/sys_segment_batch_index_queries.json @@ -1,7 +1,7 @@ [ { "query": { - "query": "SELECT count(*) FROM sys.segments WHERE datasource LIKE 'wikipedia_index_test%'" + "query": "SELECT count(*) FROM sys.segments WHERE datasource LIKE 'sys_segment_wikipedia_index_test%'" }, "expectedResults": [ { @@ -24,7 +24,7 @@ }, { "query": { - "query": "SELECT status AS status FROM sys.tasks WHERE datasource LIKE 'wikipedia_index_test%' GROUP BY 1" + "query": "SELECT status AS status FROM sys.tasks WHERE datasource LIKE 'sys_segment_wikipedia_index_test%' GROUP BY 1" }, "expectedResults": [ { From 51c73b5a4e3e5743986cf3f24401e8cd14b8169a Mon Sep 17 00:00:00 2001 From: Vadim Ogievetsky Date: Fri, 21 Jun 2024 18:33:15 -0700 Subject: [PATCH 08/72] Web console: show formatted JSON value (#16632) * show formatted json value * update snapshot * window functions * count star can also have a window * better edit query context --- licenses.yaml | 2 +- web-console/lib/keywords.js | 3 + web-console/package-lock.json | 14 +-- web-console/package.json | 2 +- .../record-table-pane/record-table-pane.tsx | 4 +- .../edit-context-dialog.spec.tsx.snap | 102 ++++++++++++++++-- .../edit-context-dialog.scss | 21 +--- .../edit-context-dialog.spec.tsx | 6 +- .../edit-context-dialog.tsx | 102 ++++++++---------- .../show-value-dialog.spec.tsx.snap | 90 +++++++++------- .../show-value-dialog/show-value-dialog.scss | 23 ++-- .../show-value-dialog/show-value-dialog.tsx | 62 +++++++++-- .../string-menu-items/string-menu-items.tsx | 2 +- .../result-table-pane/result-table-pane.tsx | 4 +- .../workbench-view/run-panel/run-panel.tsx | 2 +- 15 files changed, 282 insertions(+), 157 deletions(-) diff --git a/licenses.yaml b/licenses.yaml index 3c1f7b0b2d4..700dc891553 100644 --- a/licenses.yaml +++ b/licenses.yaml @@ -5094,7 +5094,7 @@ license_category: binary module: web-console license_name: Apache License version 2.0 copyright: Imply Data -version: 0.22.15 +version: 0.22.20 --- diff --git a/web-console/lib/keywords.js b/web-console/lib/keywords.js index bf7b9a03910..dbf10e12bac 100644 --- a/web-console/lib/keywords.js +++ b/web-console/lib/keywords.js @@ -47,6 +47,7 @@ exports.SQL_KEYWORDS = [ 'FULL', 'CROSS', 'USING', + 'NATURAL', 'FETCH', 'FIRST', 'NEXT', @@ -67,6 +68,8 @@ exports.SQL_KEYWORDS = [ 'RANGE', 'PRECEDING', 'FOLLOWING', + 'CURRENT', + 'UNBOUNDED', 'EXTEND', 'PIVOT', 'UNPIVOT', diff --git a/web-console/package-lock.json b/web-console/package-lock.json index 26999644f1e..2945955d9d6 100644 --- a/web-console/package-lock.json +++ b/web-console/package-lock.json @@ -15,7 +15,7 @@ "@blueprintjs/icons": "^4.16.0", 
"@blueprintjs/popover2": "^1.14.9", "@blueprintjs/select": "^4.9.24", - "@druid-toolkit/query": "^0.22.15", + "@druid-toolkit/query": "^0.22.20", "@druid-toolkit/visuals-core": "^0.3.3", "@druid-toolkit/visuals-react": "^0.3.3", "ace-builds": "~1.4.14", @@ -1005,9 +1005,9 @@ } }, "node_modules/@druid-toolkit/query": { - "version": "0.22.15", - "resolved": "https://registry.npmjs.org/@druid-toolkit/query/-/query-0.22.15.tgz", - "integrity": "sha512-LyQVIVkVNhduscf2wnBO/oGBvj353tS5ElIws20xQzApvEIwNNxmlkA+8npqwy77BkJj3nRQvlenbSEDHQdqow==", + "version": "0.22.20", + "resolved": "https://registry.npmjs.org/@druid-toolkit/query/-/query-0.22.20.tgz", + "integrity": "sha512-GmmSd27y7zLVTjgTBQy+XoGeSSGhSDNmwyiwWtSua7I5LX8XqHV7Chi8HIH25YQoVgTK1pLK4RS8eRXxthRAzg==", "dependencies": { "tslib": "^2.5.2" } @@ -19147,9 +19147,9 @@ "dev": true }, "@druid-toolkit/query": { - "version": "0.22.15", - "resolved": "https://registry.npmjs.org/@druid-toolkit/query/-/query-0.22.15.tgz", - "integrity": "sha512-LyQVIVkVNhduscf2wnBO/oGBvj353tS5ElIws20xQzApvEIwNNxmlkA+8npqwy77BkJj3nRQvlenbSEDHQdqow==", + "version": "0.22.20", + "resolved": "https://registry.npmjs.org/@druid-toolkit/query/-/query-0.22.20.tgz", + "integrity": "sha512-GmmSd27y7zLVTjgTBQy+XoGeSSGhSDNmwyiwWtSua7I5LX8XqHV7Chi8HIH25YQoVgTK1pLK4RS8eRXxthRAzg==", "requires": { "tslib": "^2.5.2" } diff --git a/web-console/package.json b/web-console/package.json index 44e6986c2bd..6e38ba24684 100644 --- a/web-console/package.json +++ b/web-console/package.json @@ -69,7 +69,7 @@ "@blueprintjs/icons": "^4.16.0", "@blueprintjs/popover2": "^1.14.9", "@blueprintjs/select": "^4.9.24", - "@druid-toolkit/query": "^0.22.15", + "@druid-toolkit/query": "^0.22.20", "@druid-toolkit/visuals-core": "^0.3.3", "@druid-toolkit/visuals-react": "^0.3.3", "ace-builds": "~1.4.14", diff --git a/web-console/src/components/record-table-pane/record-table-pane.tsx b/web-console/src/components/record-table-pane/record-table-pane.tsx index 29433b25ddc..6007559fb0d 100644 --- a/web-console/src/components/record-table-pane/record-table-pane.tsx +++ b/web-console/src/components/record-table-pane/record-table-pane.tsx @@ -174,7 +174,9 @@ export const RecordTablePane = React.memo(function RecordTablePane(props: Record })} /> )} - {showValue && setShowValue(undefined)} str={showValue} />} + {showValue && ( + setShowValue(undefined)} str={showValue} size="large" /> + )} ); }); diff --git a/web-console/src/dialogs/edit-context-dialog/__snapshots__/edit-context-dialog.spec.tsx.snap b/web-console/src/dialogs/edit-context-dialog/__snapshots__/edit-context-dialog.spec.tsx.snap index b9e2d072ea9..7a2ed054f3a 100644 --- a/web-console/src/dialogs/edit-context-dialog/__snapshots__/edit-context-dialog.spec.tsx.snap +++ b/web-console/src/dialogs/edit-context-dialog/__snapshots__/edit-context-dialog.spec.tsx.snap @@ -57,18 +57,102 @@ exports[`EditContextDialog matches snapshot 1`] = ` - diff --git a/web-console/src/dialogs/show-value-dialog/show-value-dialog.scss b/web-console/src/dialogs/show-value-dialog/show-value-dialog.scss index a1da01e5931..f561f1bf99f 100644 --- a/web-console/src/dialogs/show-value-dialog/show-value-dialog.scss +++ b/web-console/src/dialogs/show-value-dialog/show-value-dialog.scss @@ -19,10 +19,6 @@ @import '../../variables'; .show-value-dialog { - &.#{$bp-ns}-dialog { - padding-bottom: 10px; - } - &.normal.#{$bp-ns}-dialog { height: 600px; } @@ -32,12 +28,21 @@ height: 90vh; } - .#{$bp-ns}-input { - margin: 10px; - flex: 1; + .#{$bp-ns}-dialog-body { + display: flex; + 
flex-direction: column; + + .ace-editor { + flex: 1; + } + + .#{$bp-ns}-input { + flex: 1; + resize: none; + } } - .#{$bp-ns}-dialog-footer-actions { - padding-right: 10px; + .#{$bp-ns}-dialog-footer { + margin-top: 0; } } diff --git a/web-console/src/dialogs/show-value-dialog/show-value-dialog.tsx b/web-console/src/dialogs/show-value-dialog/show-value-dialog.tsx index 8e1b0290865..4369a43bb76 100644 --- a/web-console/src/dialogs/show-value-dialog/show-value-dialog.tsx +++ b/web-console/src/dialogs/show-value-dialog/show-value-dialog.tsx @@ -16,11 +16,21 @@ * limitations under the License. */ -import { Button, Classes, Dialog, Intent, TextArea } from '@blueprintjs/core'; +import { + Button, + ButtonGroup, + Classes, + Dialog, + FormGroup, + Intent, + TextArea, +} from '@blueprintjs/core'; import { IconNames } from '@blueprintjs/icons'; import classNames from 'classnames'; import copy from 'copy-to-clipboard'; -import React from 'react'; +import * as JSONBig from 'json-bigint-native'; +import React, { useMemo, useState } from 'react'; +import AceEditor from 'react-ace'; import { AppToaster } from '../../singletons'; @@ -35,6 +45,15 @@ export interface ShowValueDialogProps { export const ShowValueDialog = React.memo(function ShowValueDialog(props: ShowValueDialogProps) { const { title, onClose, str, size } = props; + const [tab, setTab] = useState<'formatted' | 'raw'>('formatted'); + + const parsed = useMemo(() => { + try { + return JSONBig.parse(str); + } catch {} + }, [str]); + + const hasParsed = typeof parsed !== 'undefined'; function handleCopy() { copy(str, { format: 'text/plain' }); @@ -51,10 +70,41 @@ export const ShowValueDialog = React.memo(function ShowValueDialog(props: ShowVa onClose={onClose} title={title || 'Full value'} > -