+ for (List<Emitter> emitterList : feedToEmitters.values()) {
+ for (Emitter emitter : emitterList) {
+ emittersSetBuilder.add(emitter);
+ }
+ }
+ this.knownEmitters = emittersSetBuilder.build();
+ }
+
+ /**
+ * Start the emitter. This will start all the emitters the SwitchingEmitter uses.
+ */
+ @Override
+ @LifecycleStart
+ public void start()
+ {
+ log.info("Starting Switching Emitter.");
+
+ for (Emitter e : knownEmitters) {
+ log.info("Starting emitter %s.", e.getClass().getName());
+ e.start();
+ }
+ }
+
+ /**
+ * Emit an event. This method must not throw exceptions or block. The emitters that this uses must also not throw
+ * exceptions or block.
+ *
+ * This emitter directs events to a list of emitters based on the event's feed. If there is no matching feed, the
+ * event is sent to a list of default emitters instead.
+ *
+ * If an emitter used by this emitter receives too many events and its internal queues fill up, it should drop
+ * events rather than block or consume excessive memory.
+ *
+ * If an emitter that this emitter uses receives input it considers to be invalid, or has an internal problem, it
+ * should deal with that by logging a warning rather than throwing an exception. Emitters that log warnings
+ * should consider throttling warnings to avoid excessive logs, since a busy Druid cluster can emit a high volume of
+ * events.
+ *
+ * @param event The event that will be emitted.
+ */
+ @Override
+ public void emit(Event event)
+ {
+ // linear search is likely faster than hashed lookup
+ for (Map.Entry<String, List<Emitter>> feedToEmitters : feedToEmitters.entrySet()) {
+ if (feedToEmitters.getKey().equals(event.getFeed())) {
+ for (Emitter emitter : feedToEmitters.getValue()) {
+ emitter.emit(event);
+ }
+ return;
+ }
+ }
+ for (Emitter emitter : defaultEmitters) {
+ emitter.emit(event);
+ }
+ }
+
+ /**
+ * Triggers a flush on all the emitters that this emitter uses.
+ * @throws IOException if flushing any of the underlying emitters fails
+ */
+ @Override
+ public void flush() throws IOException
+ {
+ boolean fail = false;
+ log.info("Flushing Switching Emitter.");
+
+ for (Emitter e : knownEmitters) {
+ try {
+ log.info("Flushing emitter %s.", e.getClass().getName());
+ e.flush();
+ }
+ catch (IOException ex) {
+ log.error(ex, "Failed to flush emitter [%s]", e.getClass().getName());
+ fail = true;
+ }
+ }
+
+ if (fail) {
+ throw new IOException("failed to flush one or more emitters");
+ }
+ }
+
+ /**
+ * Closes all the emitters that the SwitchingEmitter uses.
+ * @throws IOException if closing any of the underlying emitters fails
+ */
+ @Override
+ @LifecycleStop
+ public void close() throws IOException
+ {
+ boolean fail = false;
+ log.info("Closing Switching Emitter.");
+
+ for (Emitter e : knownEmitters) {
+ try {
+ log.info("Closing emitter %s.", e.getClass().getName());
+ e.close();
+ }
+ catch (IOException ex) {
+ log.error(ex, "Failed to close emitter [%s]", e.getClass().getName());
+ fail = true;
+ }
+ }
+
+ if (fail) {
+ throw new IOException("failed to close one or more emitters");
+ }
+ }
+}
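A minimal usage sketch of the class above (the `httpEmitter`/`logEmitter` instances and the two events are illustrative placeholders, not part of this patch):

```java
// Route "metrics" events to an HTTP emitter; all other feeds fall back to the log emitter.
Map<String, List<Emitter>> feedToEmitters = ImmutableMap.of(
    "metrics", ImmutableList.of(httpEmitter)
);
SwitchingEmitter emitter = new SwitchingEmitter(feedToEmitters, new Emitter[]{logEmitter});

emitter.start();                 // starts every known emitter exactly once
emitter.emit(metricsFeedEvent);  // feed "metrics" -> httpEmitter
emitter.emit(alertsFeedEvent);   // no matching feed -> default emitters
emitter.flush();
emitter.close();
```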
diff --git a/core/src/main/java/org/apache/druid/segment/column/TypeStrategies.java b/core/src/main/java/org/apache/druid/segment/column/TypeStrategies.java
index 54a15b1dbdf3..20507c597b0f 100644
--- a/core/src/main/java/org/apache/druid/segment/column/TypeStrategies.java
+++ b/core/src/main/java/org/apache/druid/segment/column/TypeStrategies.java
@@ -236,8 +236,6 @@ public static void checkMaxSize(int available, int maxSizeBytes, TypeSignature
*/
public static final class LongTypeStrategy implements TypeStrategy<Long>
{
- private static final Comparator<Long> COMPARATOR = Longs::compare;
-
@Override
public int estimateSizeBytes(Long value)
{
@@ -276,9 +274,9 @@ public int write(ByteBuffer buffer, Long value, int maxSizeBytes)
}
@Override
- public int compare(Long o1, Long o2)
+ public int compare(Object o1, Object o2)
{
- return COMPARATOR.compare(o1, o2);
+ return Longs.compare(((Number) o1).longValue(), ((Number) o2).longValue());
}
}
@@ -289,8 +287,6 @@ public int compare(Long o1, Long o2)
*/
public static final class FloatTypeStrategy implements TypeStrategy<Float>
{
- private static final Comparator<Float> COMPARATOR = Floats::compare;
-
@Override
public int estimateSizeBytes(Float value)
{
@@ -329,9 +325,9 @@ public int write(ByteBuffer buffer, Float value, int maxSizeBytes)
}
@Override
- public int compare(Float o1, Float o2)
+ public int compare(Object o1, Object o2)
{
- return COMPARATOR.compare(o1, o2);
+ return Floats.compare(((Number) o1).floatValue(), ((Number) o2).floatValue());
}
}
@@ -342,7 +338,6 @@ public int compare(Float o1, Float o2)
*/
public static final class DoubleTypeStrategy implements TypeStrategy<Double>
{
- private static final Comparator<Double> COMPARATOR = Double::compare;
@Override
public int estimateSizeBytes(Double value)
@@ -382,9 +377,9 @@ public int write(ByteBuffer buffer, Double value, int maxSizeBytes)
}
@Override
- public int compare(Double o1, Double o2)
+ public int compare(Object o1, Object o2)
{
- return COMPARATOR.compare(o1, o2);
+ return Double.compare(((Number) o1).doubleValue(), ((Number) o2).doubleValue());
}
}
@@ -437,7 +432,7 @@ public int write(ByteBuffer buffer, String value, int maxSizeBytes)
}
@Override
- public int compare(String s, String s2)
+ public int compare(Object s, Object s2)
{
// copy of lexicographical string comparator in druid processing
// Avoid comparisons for equal references
@@ -447,7 +442,7 @@ public int compare(String s, String s2)
return 0;
}
- return ORDERING.compare(s, s2);
+ return ORDERING.compare((String) s, (String) s2);
}
}
@@ -521,8 +516,11 @@ public int write(ByteBuffer buffer, Object[] value, int maxSizeBytes)
}
@Override
- public int compare(@Nullable Object[] o1, @Nullable Object[] o2)
+ public int compare(@Nullable Object o1Obj, @Nullable Object o2Obj)
{
+ Object[] o1 = (Object[]) o1Obj;
+ Object[] o2 = (Object[]) o2Obj;
+
//noinspection ArrayEquality
if (o1 == o2) {
return 0;
diff --git a/core/src/main/java/org/apache/druid/segment/column/TypeStrategy.java b/core/src/main/java/org/apache/druid/segment/column/TypeStrategy.java
index 8a97882d54df..e4856f889714 100644
--- a/core/src/main/java/org/apache/druid/segment/column/TypeStrategy.java
+++ b/core/src/main/java/org/apache/druid/segment/column/TypeStrategy.java
@@ -55,8 +55,15 @@
* Implementations of this interface should be thread safe, but may not use {@link ByteBuffer} in a thread safe manner,
* potentially modifying positions and limits, either temporarily or permanently depending on which set of methods is
* called.
+ *
+ * This interface extends {@code Comparator<Object>} instead of {@code Comparator<T>} because trying to specialize the
+ * type of the comparison method can run into issues for comparators of objects that can sometimes be of a different
+ * java class type. For example, {@code Comparator<Long>} cannot accept Integer objects in its comparison method
+ * and there is no easy way for this interface definition to allow {@code TypeStrategy<Long>} to actually be a
+ * {@code Comparator<Number>}. So, we fall back to effectively erasing the generic type and having them all be
+ * {@code Comparator<Object>}.
*/
-public interface TypeStrategy<T> extends Comparator<T>
+public interface TypeStrategy<T> extends Comparator<Object>
{
/**
* Estimate the size in bytes that writing this value to memory would require. This method is not required to be
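To make the comparator discussion above concrete, here is a small sketch using the `LongTypeStrategy` from this patch; with `compare(Object, Object)`, mixed `Number` types are now accepted:

```java
TypeStrategy<Long> strategy = new TypeStrategies.LongTypeStrategy();

// Both arguments are coerced through Number, matching the new implementation:
// Longs.compare(((Number) o1).longValue(), ((Number) o2).longValue())
int cmp = strategy.compare(1L, 2);  // negative: 1 < 2, despite Long vs Integer
int eq = strategy.compare(3, 3L);   // 0: Integer 3 and Long 3L compare equal
```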
diff --git a/core/src/main/java/org/apache/druid/utils/RuntimeInfo.java b/core/src/main/java/org/apache/druid/utils/RuntimeInfo.java
index c8dadfd44d19..86571eff9456 100644
--- a/core/src/main/java/org/apache/druid/utils/RuntimeInfo.java
+++ b/core/src/main/java/org/apache/druid/utils/RuntimeInfo.java
@@ -19,10 +19,12 @@
package org.apache.druid.utils;
+import org.apache.druid.guice.LazySingleton;
import org.apache.druid.java.util.common.UOE;
import java.lang.reflect.InvocationTargetException;
+@LazySingleton
public class RuntimeInfo
{
public int getAvailableProcessors()
diff --git a/core/src/test/java/org/apache/druid/java/util/common/IntervalsTest.java b/core/src/test/java/org/apache/druid/java/util/common/IntervalsTest.java
new file mode 100644
index 000000000000..59eac8d5a991
--- /dev/null
+++ b/core/src/test/java/org/apache/druid/java/util/common/IntervalsTest.java
@@ -0,0 +1,81 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.java.util.common;
+
+import org.apache.druid.java.util.common.guava.Comparators;
+import org.joda.time.Interval;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.util.Arrays;
+
+public class IntervalsTest
+{
+
+ @Test
+ public void testFindOverlappingInterval()
+ {
+ final Interval[] sortedIntervals = new Interval[]{
+ Intervals.of("2019/2020"),
+ Intervals.of("2021/2022"),
+ Intervals.of("2021-04-01/2021-05-01"),
+ Intervals.of("2022/2023")
+ };
+ Arrays.sort(sortedIntervals, Comparators.intervalsByStartThenEnd());
+
+ // Search interval outside the bounds of the sorted intervals
+ Assert.assertNull(
+ Intervals.findOverlappingInterval(Intervals.of("2018/2019"), sortedIntervals)
+ );
+ Assert.assertNull(
+ Intervals.findOverlappingInterval(Intervals.of("2023/2024"), sortedIntervals)
+ );
+
+ // Search interval within bounds, overlap exists
+ // Fully overlapping interval
+ Assert.assertEquals(
+ Intervals.of("2021/2022"),
+ Intervals.findOverlappingInterval(Intervals.of("2021/2022"), sortedIntervals)
+ );
+
+ // Partially overlapping interval
+ Assert.assertEquals(
+ Intervals.of("2022/2023"),
+ Intervals.findOverlappingInterval(Intervals.of("2022-01-01/2022-01-02"), sortedIntervals)
+ );
+
+ Assert.assertEquals(
+ Intervals.of("2021/2022"),
+ Intervals.findOverlappingInterval(Intervals.of("2021-06-01/2021-07-01"), sortedIntervals)
+ );
+
+ // Overlap with multiple intervals, "smallest" one is returned
+ Assert.assertEquals(
+ Intervals.of("2021/2022"),
+ Intervals.findOverlappingInterval(Intervals.of("2021-03-01/2021-04-01"), sortedIntervals)
+ );
+
+ // Search interval within bounds, no overlap
+ Assert.assertNull(
+ Intervals.findOverlappingInterval(Intervals.of("2020-01-02/2020-03-03"), sortedIntervals)
+ );
+ }
+
+}
diff --git a/core/src/test/java/org/apache/druid/java/util/common/parsers/ObjectFlattenersTest.java b/core/src/test/java/org/apache/druid/java/util/common/parsers/ObjectFlattenersTest.java
index 2b610690db0a..e0b0fbcc510c 100644
--- a/core/src/test/java/org/apache/druid/java/util/common/parsers/ObjectFlattenersTest.java
+++ b/core/src/test/java/org/apache/druid/java/util/common/parsers/ObjectFlattenersTest.java
@@ -23,6 +23,7 @@
import com.fasterxml.jackson.databind.JsonNode;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.common.collect.ImmutableList;
+import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import org.junit.Assert;
import org.junit.Test;
@@ -32,12 +33,14 @@
public class ObjectFlattenersTest
{
private static final String SOME_JSON = "{\"foo\": null, \"bar\": 1}";
+
+ private static final ObjectFlatteners.FlattenerMaker<JsonNode> FLATTENER_MAKER = new JSONFlattenerMaker(true);
private static final ObjectFlattener<JsonNode> FLATTENER = ObjectFlatteners.create(
new JSONPathSpec(
true,
ImmutableList.of(new JSONPathFieldSpec(JSONPathFieldType.PATH, "extract", "$.bar"))
),
- new JSONFlattenerMaker(true)
+ FLATTENER_MAKER
);
private static final ObjectMapper OBJECT_MAPPER = new ObjectMapper();
@@ -62,4 +65,13 @@ public void testToMap() throws JsonProcessingException
Assert.assertNull(flat.get("foo"));
Assert.assertEquals(1, flat.get("bar"));
}
+
+ @Test
+ public void testToMapNull() throws JsonProcessingException
+ {
+ JsonNode node = OBJECT_MAPPER.readTree("null");
+ Map<String, Object> flat = FLATTENER.toMap(node);
+ Assert.assertNull(FLATTENER_MAKER.toPlainJavaType(node));
+ Assert.assertEquals(ImmutableMap.of(), flat);
+ }
}
diff --git a/core/src/test/java/org/apache/druid/java/util/emitter/core/SwitchingEmitterTest.java b/core/src/test/java/org/apache/druid/java/util/emitter/core/SwitchingEmitterTest.java
new file mode 100644
index 000000000000..5183b47947af
--- /dev/null
+++ b/core/src/test/java/org/apache/druid/java/util/emitter/core/SwitchingEmitterTest.java
@@ -0,0 +1,153 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.java.util.emitter.core;
+
+import com.google.common.collect.ImmutableList;
+import com.google.common.collect.ImmutableMap;
+import org.easymock.EasyMock;
+import org.junit.After;
+import org.junit.Before;
+import org.junit.Test;
+
+import java.io.IOException;
+import java.util.HashSet;
+import java.util.List;
+import java.util.Map;
+import java.util.Set;
+
+public class SwitchingEmitterTest
+{
+
+ private static final String FEED_1 = "feed1";
+ private static final String FEED_2 = "feed2";
+ private static final String FEED_3 = "feed3";
+ private SwitchingEmitter switchingEmitter;
+
+ private Map<String, List<Emitter>> emitters;
+ private List<Emitter> defaultEmitters;
+
+ private Emitter feed1Emitter1;
+ private Emitter feed1Emitter2;
+ private Emitter feed2Emitter1;
+ private Emitter feed1AndFeed3Emitter;
+
+ private Set<Emitter> allEmitters;
+
+ @Before
+ public void setup()
+ {
+ this.defaultEmitters = ImmutableList.of(
+ EasyMock.createMock(Emitter.class),
+ EasyMock.createMock(Emitter.class)
+ );
+ this.feed1Emitter1 = EasyMock.createMock(Emitter.class);
+ this.feed1Emitter2 = EasyMock.createMock(Emitter.class);
+ this.feed2Emitter1 = EasyMock.createMock(Emitter.class);
+ this.feed1AndFeed3Emitter = EasyMock.createMock(Emitter.class);
+ this.emitters = ImmutableMap.of(FEED_1, ImmutableList.of(feed1Emitter1, feed1Emitter2, feed1AndFeed3Emitter),
+ FEED_2, ImmutableList.of(feed2Emitter1),
+ FEED_3, ImmutableList.of(feed1AndFeed3Emitter));
+
+ allEmitters = new HashSet<>();
+ allEmitters.addAll(defaultEmitters);
+ for (List<Emitter> feedEmitters : emitters.values()) {
+ allEmitters.addAll(feedEmitters);
+ }
+ this.switchingEmitter = new SwitchingEmitter(emitters, defaultEmitters.toArray(new Emitter[0]));
+ }
+
+ @Test
+ public void testStart()
+ {
+ for (Emitter emitter : allEmitters) {
+ emitter.start();
+ EasyMock.replay(emitter);
+ }
+
+ switchingEmitter.start();
+ }
+
+ @Test
+ public void testEmit()
+ {
+ // test emitting events to all 3 feeds and default emitter
+ Event feed1Event = EasyMock.createMock(Event.class);
+ Event feed2Event = EasyMock.createMock(Event.class);
+ Event feed3Event = EasyMock.createMock(Event.class);
+ Event eventWithNoMatchingFeed = EasyMock.createMock(Event.class);
+
+ EasyMock.expect(feed1Event.getFeed()).andReturn(FEED_1).anyTimes();
+ EasyMock.expect(feed2Event.getFeed()).andReturn(FEED_2).anyTimes();
+ EasyMock.expect(feed3Event.getFeed()).andReturn(FEED_3).anyTimes();
+ EasyMock.expect(eventWithNoMatchingFeed.getFeed()).andReturn("no-real-feed").anyTimes();
+ EasyMock.replay(feed1Event, feed2Event, feed3Event, eventWithNoMatchingFeed);
+
+ for (Emitter emitter : defaultEmitters) {
+ emitter.emit(eventWithNoMatchingFeed);
+ }
+ for (Emitter emitter : emitters.get("feed1")) {
+ emitter.emit(feed1Event);
+ }
+ for (Emitter emitter : emitters.get("feed2")) {
+ emitter.emit(feed2Event);
+ }
+ for (Emitter emitter : emitters.get("feed3")) {
+ emitter.emit(feed3Event);
+ }
+ for (Emitter emitter : allEmitters) {
+ EasyMock.replay(emitter);
+ }
+
+ switchingEmitter.emit(feed1Event);
+ switchingEmitter.emit(feed2Event);
+ switchingEmitter.emit(feed3Event);
+ switchingEmitter.emit(eventWithNoMatchingFeed);
+ }
+
+ @Test
+ public void testFlush() throws IOException
+ {
+ for (Emitter emitter : allEmitters) {
+ emitter.flush();
+ EasyMock.replay(emitter);
+ }
+
+ switchingEmitter.flush();
+ }
+
+ @Test
+ public void testClose() throws IOException
+ {
+ for (Emitter emitter : allEmitters) {
+ emitter.close();
+ EasyMock.replay(emitter);
+ }
+
+ switchingEmitter.close();
+ }
+
+ @After
+ public void tearDown()
+ {
+ for (Emitter emitter : allEmitters) {
+ EasyMock.verify(emitter);
+ }
+ }
+}
diff --git a/core/src/test/java/org/apache/druid/java/util/metrics/MetricsVerifier.java b/core/src/test/java/org/apache/druid/java/util/metrics/MetricsVerifier.java
new file mode 100644
index 000000000000..c0f2eaeaf15f
--- /dev/null
+++ b/core/src/test/java/org/apache/druid/java/util/metrics/MetricsVerifier.java
@@ -0,0 +1,98 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.java.util.metrics;
+
+import org.junit.Assert;
+
+import java.util.List;
+import java.util.Map;
+
+/**
+ * Test utility to extract and verify metric values.
+ */
+public interface MetricsVerifier
+{
+ /**
+ * Verifies that no event has been emitted for the given metric.
+ */
+ default void verifyNotEmitted(String metricName)
+ {
+ verifyEmitted(metricName, 0);
+ }
+
+ /**
+ * Verifies that the metric was emitted the expected number of times.
+ */
+ default void verifyEmitted(String metricName, int times)
+ {
+ verifyEmitted(metricName, null, times);
+ }
+
+ /**
+ * Verifies that the metric was emitted for the given dimension filters the
+ * expected number of times.
+ */
+ default void verifyEmitted(String metricName, Map<String, Object> dimensionFilters, int times)
+ {
+ Assert.assertEquals(
+ "Metric was emitted unexpected number of times.",
+ times,
+ getMetricValues(metricName, dimensionFilters).size()
+ );
+ }
+
+ /**
+ * Verifies the value of the specified metric emitted in the previous run.
+ */
+ default void verifyValue(String metricName, Number expectedValue)
+ {
+ verifyValue(metricName, null, expectedValue);
+ }
+
+ /**
+ * Verifies the value of the event corresponding to the specified metric and
+ * dimensionFilters emitted in the previous run.
+ */
+ default void verifyValue(String metricName, Map<String, Object> dimensionFilters, Number expectedValue)
+ {
+ Assert.assertEquals(expectedValue, getValue(metricName, dimensionFilters));
+ }
+
+ /**
+ * Gets the value of the event corresponding to the specified metric and
+ * dimensionFilters.
+ */
+ default Number getValue(String metricName, Map<String, Object> dimensionFilters)
+ {
+ List<Number> values = getMetricValues(metricName, dimensionFilters);
+ Assert.assertEquals(
+ "Metric must have been emitted exactly once for the given dimensions.",
+ 1,
+ values.size()
+ );
+ return values.get(0);
+ }
+
+ /**
+ * Gets the metric values for the specified dimension filters.
+ */
+ List<Number> getMetricValues(String metricName, Map<String, Object> dimensionFilters);
+
+}
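A minimal usage sketch of this interface together with the `StubServiceEmitter` below (which implements it); the metric and dimension names are illustrative, and the builder calls assume the standard `ServiceMetricEvent.Builder` API:

```java
StubServiceEmitter emitter = new StubServiceEmitter("overlord", "localhost");

emitter.emit(
    ServiceMetricEvent.builder()
                      .setDimension("taskType", "index")
                      .build("task/run/time", 25L)
);

emitter.verifyEmitted("task/run/time", 1);
emitter.verifyValue("task/run/time", ImmutableMap.of("taskType", "index"), 25L);
emitter.verifyNotEmitted("segment/count");
```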
diff --git a/core/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java b/core/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java
index 653dc8a08aae..395245815792 100644
--- a/core/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java
+++ b/core/src/test/java/org/apache/druid/java/util/metrics/StubServiceEmitter.java
@@ -24,12 +24,15 @@
import org.apache.druid.java.util.emitter.service.ServiceMetricEvent;
import java.util.ArrayList;
+import java.util.Collections;
+import java.util.HashMap;
import java.util.List;
+import java.util.Map;
-public class StubServiceEmitter extends ServiceEmitter
+public class StubServiceEmitter extends ServiceEmitter implements MetricsVerifier
{
private final List<Event> events = new ArrayList<>();
- private final List<ServiceMetricEvent> metricEvents = new ArrayList<>();
+ private final Map<String, List<ServiceMetricEvent>> metricEvents = new HashMap<>();
public StubServiceEmitter(String service, String host)
{
@@ -40,7 +43,9 @@ public StubServiceEmitter(String service, String host)
public void emit(Event event)
{
if (event instanceof ServiceMetricEvent) {
- metricEvents.add((ServiceMetricEvent) event);
+ ServiceMetricEvent metricEvent = (ServiceMetricEvent) event;
+ metricEvents.computeIfAbsent(metricEvent.getMetric(), name -> new ArrayList<>())
+ .add(metricEvent);
}
events.add(event);
}
@@ -53,12 +58,29 @@ public List<Event> getEvents()
return events;
}
- /**
- * Gets all the metric events emitted since the previous {@link #flush()}.
- */
- public List<ServiceMetricEvent> getMetricEvents()
+ @Override
+ public List<Number> getMetricValues(
+ String metricName,
+ Map<String, Object> dimensionFilters
+ )
{
- return metricEvents;
+ final List<Number> values = new ArrayList<>();
+ final List<ServiceMetricEvent> events =
+ metricEvents.getOrDefault(metricName, Collections.emptyList());
+ final Map<String, Object> filters =
+ dimensionFilters == null ? Collections.emptyMap() : dimensionFilters;
+ for (ServiceMetricEvent event : events) {
+ final Map<String, Object> userDims = event.getUserDims();
+ boolean match = filters.keySet().stream()
+ .map(d -> filters.get(d).equals(userDims.get(d)))
+ .reduce((a, b) -> a && b)
+ .orElse(true);
+ if (match) {
+ values.add(event.getValue());
+ }
+ }
+
+ return values;
}
@Override
diff --git a/core/src/test/java/org/apache/druid/segment/column/TypeStrategiesTest.java b/core/src/test/java/org/apache/druid/segment/column/TypeStrategiesTest.java
index fa6d86d21f50..66f4adcdd02d 100644
--- a/core/src/test/java/org/apache/druid/segment/column/TypeStrategiesTest.java
+++ b/core/src/test/java/org/apache/druid/segment/column/TypeStrategiesTest.java
@@ -19,6 +19,7 @@
package org.apache.druid.segment.column;
+import com.google.common.collect.Ordering;
import com.google.common.primitives.Longs;
import org.apache.druid.java.util.common.IAE;
import org.apache.druid.java.util.common.Pair;
@@ -103,7 +104,7 @@ public int write(ByteBuffer buffer, String value, int maxSizeBytes)
}
@Override
- public int compare(String o1, String o2)
+ public int compare(Object o1, Object o2)
{
return 0;
}
@@ -639,10 +640,13 @@ public int compareTo(NullableLongPair o)
public static class NullableLongPairTypeStrategy implements TypeStrategy<NullableLongPair>
{
+
+ private Ordering<NullableLongPair> ordering = Comparators.naturalNullsFirst();
+
@Override
- public int compare(NullableLongPair o1, NullableLongPair o2)
+ public int compare(Object o1, Object o2)
{
- return Comparators.naturalNullsFirst().compare(o1, o2);
+ return ordering.compare((NullableLongPair) o1, (NullableLongPair) o2);
}
@Override
diff --git a/distribution/docker/docker-compose.yml b/distribution/docker/docker-compose.yml
index 58b7a47a4b4a..ea9adcea0d70 100644
--- a/distribution/docker/docker-compose.yml
+++ b/distribution/docker/docker-compose.yml
@@ -49,7 +49,7 @@ services:
- ZOO_MY_ID=1
coordinator:
- image: apache/druid:0.24.0
+ image: apache/druid:24.0.1
container_name: coordinator
volumes:
- druid_shared:/opt/shared
diff --git a/distribution/pom.xml b/distribution/pom.xml
index e2b7773b09d4..7b92e3436b45 100644
--- a/distribution/pom.xml
+++ b/distribution/pom.xml
@@ -30,7 +30,7 @@
druid
org.apache.druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
diff --git a/docs/configuration/index.md b/docs/configuration/index.md
index 6fb3201d98f4..a14b3beb56c7 100644
--- a/docs/configuration/index.md
+++ b/docs/configuration/index.md
@@ -418,6 +418,7 @@ There are several emitters available:
- [`parametrized`](#parametrized-http-emitter-module) operates like the `http` emitter but fine-tunes the recipient URL based on the event feed.
- [`composing`](#composing-emitter-module) initializes multiple emitter modules.
- [`graphite`](#graphite-emitter) emits metrics to a [Graphite](https://graphiteapp.org/) Carbon service.
+- [`switching`](#switching-emitter) initializes and emits to multiple emitter modules based on the event feed.
##### Logging Emitter Module
@@ -483,6 +484,14 @@ Instead use `recipientBaseUrlPattern` described in the table below.
To use graphite as emitter set `druid.emitter=graphite`. For configuration details, see [Graphite emitter](../development/extensions-contrib/graphite.md) for the Graphite emitter Druid extension.
+##### Switching Emitter
+
+To use the switching emitter, set `druid.emitter=switching`.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.emitter.switching.emitters`|JSON map of feed to the list of emitter modules used for that feed, e.g., `{"metrics":["http"], "alerts":["logging"]}`.|{}|
+|`druid.emitter.switching.defaultEmitters`|JSON list of emitter modules to load, used when no emitter is specifically designated for an event's feed, e.g., `["logging","http"]`.|[]|
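+
+For example, the following properties (a sketch; the chosen emitter modules are illustrative) send `metrics` events over HTTP, send `alerts` events to the log, and fall back to the logging emitter for every other feed:
+
+```
+druid.emitter=switching
+druid.emitter.switching.emitters={"metrics":["http"],"alerts":["logging"]}
+druid.emitter.switching.defaultEmitters=["logging"]
+```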
### Metadata storage
@@ -939,7 +948,7 @@ Issuing a GET request at the same URL will return the spec that is currently in
|`mergeBytesLimit`|The maximum total uncompressed size in bytes of segments to merge.|524288000L|
|`mergeSegmentsLimit`|The maximum number of segments that can be in a single [append task](../ingestion/tasks.md).|100|
|`maxSegmentsToMove`|The maximum number of segments that can be moved at any given time.|5|
-|`useBatchedSegmentSampler`|Boolean flag for whether or not we should use the Reservoir Sampling with a reservoir of size k instead of fixed size 1 to pick segments to move. This option can be enabled to speed up segment balancing process, especially if there are huge number of segments in the cluster or if there are too many segments to move.|false|
+|`useBatchedSegmentSampler`|Deprecated. Boolean flag for whether to use reservoir sampling with a reservoir of size k, instead of a fixed size of 1, when picking segments to move. Enabling this can speed up the sampling of segments to be balanced, especially when the cluster has a very large number of segments or many segments need to be moved.|true|
|`percentOfSegmentsToConsiderPerMove`|Deprecated. This will eventually be phased out by the batched segment sampler. You can enable the batched segment sampler now by setting the dynamic Coordinator config, `useBatchedSegmentSampler`, to `true`. Note that if you choose to enable the batched segment sampler, `percentOfSegmentsToConsiderPerMove` will no longer have any effect on balancing. If `useBatchedSegmentSampler == false`, this config defines the percentage of the total number of segments in the cluster that are considered every time a segment needs to be selected for a move. Druid orders servers by available capacity ascending (the least available capacity first) and then iterates over the servers. For each server, Druid iterates over the segments on the server, considering them for moving. The default config of 100% means that every segment on every server is a candidate to be moved. This should make sense for most small to medium-sized clusters. However, an admin may find it preferable to drop this value lower if they don't think that it is worthwhile to consider every single segment in the cluster each time it is looking for a segment to move.|100|
|`replicantLifetime`|The maximum number of Coordinator runs for a segment to be replicated before we start alerting.|15|
|`replicationThrottleLimit`|The maximum number of segments that can be replicated at one time.|10|
@@ -948,6 +957,7 @@ Issuing a GET request at the same URL will return the spec that is currently in
|`killDataSourceWhitelist`|List of specific data sources for which kill tasks are sent if property `druid.coordinator.kill.on` is true. This can be a list of comma-separated data source names or a JSON array.|none|
|`killPendingSegmentsSkipList`|List of data sources for which pendingSegments are _NOT_ cleaned up if property `druid.coordinator.kill.pendingSegments.on` is true. This can be a list of comma-separated data sources or a JSON array.|none|
|`maxSegmentsInNodeLoadingQueue`|The maximum number of segments that could be queued for loading to any given server. This parameter could be used to speed up segments loading process, especially if there are "slow" nodes in the cluster (with low loading speed) or if too much segments scheduled to be replicated to some particular node (faster loading could be preferred to better segments distribution). Desired value depends on segments loading speed, acceptable replication time and number of nodes. Value 1000 could be a start point for a rather big cluster. Default value is 100. |100|
+|`useRoundRobinSegmentAssignment`|Boolean flag for whether segments should be assigned to Historicals in a round-robin fashion. When disabled, segment assignment is done using the chosen balancer strategy. When enabled, this can speed up segment assignment, leaving the balancer strategy to lazily move segments to their optimal locations.|false|
|`decommissioningNodes`| List of historical servers to 'decommission'. Coordinator will not assign new segments to 'decommissioning' servers, and segments will be moved away from them to be placed on non-decommissioning servers at the maximum rate specified by `decommissioningMaxPercentOfMaxSegmentsToMove`.|none|
|`decommissioningMaxPercentOfMaxSegmentsToMove`| Upper limit of segments the Coordinator can move from decommissioning servers to active non-decommissioning servers during a single run. This value is relative to the total maximum number of segments that can be moved at any given time based upon the value of `maxSegmentsToMove`. If `decommissioningMaxPercentOfMaxSegmentsToMove` is 0, the Coordinator does not move segments to decommissioning servers, effectively putting them in a type of "maintenance" mode. In this case, decommissioning servers do not participate in balancing or assignment by load rules. The Coordinator still considers segments on decommissioning servers as candidates to replicate on active servers. Decommissioning can stall if there are no available active servers to move the segments to. You can use the maximum percent of decommissioning segment movements to prioritize balancing or to decrease commissioning time to prevent active servers from being overloaded. The value must be between 0 and 100.|70|
|`pauseCoordination`| Boolean flag for whether or not the coordinator should execute its various duties of coordinating the cluster. Setting this to true essentially pauses all coordination work while allowing the API to remain up. Duties that are paused include all classes that implement the `CoordinatorDuty` Interface. Such duties include: Segment balancing, Segment compaction, Emission of metrics controlled by the dynamic coordinator config `emitBalancingStats`, Submitting kill tasks for unused segments (if enabled), Logging of used segments in the cluster, Marking of newly unused or overshadowed segments, Matching and execution of load/drop rules for used segments, Unloading segments that are no longer marked as used from Historical servers. An example of when an admin may want to pause coordination would be if they are doing deep storage maintenance on HDFS Name Nodes with downtime and don't want the coordinator to be directing Historical Nodes to hit the Name Node with API requests until maintenance is done and the deep store is declared healthy for use again. |false|
@@ -1102,6 +1112,8 @@ These Overlord static configurations can be defined in the `overlord/runtime.pro
|`druid.indexer.storage.type`|Choices are "local" or "metadata". Indicates whether incoming tasks should be stored locally (in heap) or in metadata storage. "local" is mainly for internal testing while "metadata" is recommended in production because storing incoming tasks in metadata storage allows for tasks to be resumed if the Overlord should fail.|local|
|`druid.indexer.storage.recentlyFinishedThreshold`|Duration of time to store task results. Default is 24 hours. If you have hundreds of tasks running in a day, consider increasing this threshold.|PT24H|
|`druid.indexer.tasklock.forceTimeChunkLock`|_**Setting this to false is still experimental**_ If set, all tasks are enforced to use time chunk lock. If not set, each task automatically chooses a lock type to use. This configuration can be overwritten by setting `forceTimeChunkLock` in the [task context](../ingestion/tasks.md#context). See [Task Locking & Priority](../ingestion/tasks.md#context) for more details about locking in tasks.|true|
+|`druid.indexer.tasklock.batchSegmentAllocation`| If set to true, Druid performs segment allocate actions in batches to improve throughput and reduce the average `task/action/run/time`. See [batching `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions) for details.|false|
+|`druid.indexer.tasklock.batchAllocationWaitTime`|Number of milliseconds after Druid adds the first segment allocate action to a batch, until it executes the batch. Allows the batch to add more requests and improve the average segment allocation run time. This configuration takes effect only if `batchSegmentAllocation` is enabled.|500|
|`druid.indexer.task.default.context`|Default task context that is applied to all tasks submitted to the Overlord. Any default in this config does not override neither the context values the user provides nor `druid.indexer.tasklock.forceTimeChunkLock`.|empty context|
|`druid.indexer.queue.maxSize`|Maximum number of active tasks at one time.|Integer.MAX_VALUE|
|`druid.indexer.queue.startDelay`|Sleep this long before starting Overlord queue management. This can be useful to give a cluster time to re-orient itself after e.g. a widespread network issue.|PT1M|
@@ -1375,7 +1387,7 @@ For GCE's properties, please refer to the [gce-extensions](../development/extens
This section contains the configuration options for the processes that reside on Data servers (MiddleManagers/Peons and Historicals) in the suggested [three-server configuration](../design/processes.md#server-types).
-Configuration options for the experimental [Indexer process](../design/indexer.md) are also provided here.
+Configuration options for the [Indexer process](../design/indexer.md) are also provided here.
### MiddleManager and Peons
@@ -2188,7 +2200,7 @@ Supported query contexts:
|Key|Description|Default|
|---|-----------|-------|
|`druid.expressions.useStrictBooleans`|Controls the behavior of Druid boolean operators and functions, if set to `true` all boolean values will be either a `1` or `0`. See [expression documentation](../misc/math-expr.md#logical-operator-modes)|false|
-|`druid.expressions.allowNestedArrays`|If enabled, Druid array expressions can create nested arrays. This is experimental and should be used with caution.|false|
+|`druid.expressions.allowNestedArrays`|If enabled, Druid array expressions can create nested arrays.|false|
### Router
#### Router Process Configs
diff --git a/docs/development/experimental-features.md b/docs/development/experimental-features.md
new file mode 100644
index 000000000000..30d8c2f77c2b
--- /dev/null
+++ b/docs/development/experimental-features.md
@@ -0,0 +1,60 @@
+---
+id: experimental-features
+title: "Experimental features"
+---
+
+
+
+The following features are marked [experimental](./experimental.md) in the Druid docs.
+
+This document includes each page that mentions an experimental feature. To graduate a feature, remove all mentions of its experimental status on all relevant pages.
+
+Note that this document does not track the status of contrib extensions, all of which are considered experimental.
+
+## SQL-based ingestion
+
+- [SQL-based ingestion](../multi-stage-query/index.md)
+- [SQL-based ingestion concepts](../multi-stage-query/concepts.md)
+- [SQL-based ingestion and multi-stage query task API](../multi-stage-query/api.md)
+
+## Indexer process
+
+- [Indexer process](../design/indexer.md)
+- [Processes and servers](../design/processes.md#indexer-process-optional)
+
+## Kubernetes
+
+- [Kubernetes](../development/extensions-core/kubernetes.md)
+
+## Segment locking
+
+- [Configuration reference](../configuration/index.md#overlord-operations)
+- [Task reference](../ingestion/tasks.md#locking)
+- [Design](../design/architecture.md#availability-and-consistency)
+
+## Front coding
+
+- [Ingestion spec reference](../ingestion/ingestion-spec.md#front-coding)
+
+## Other configuration properties
+
+- [Configuration reference](../configuration/index.md)
+ - `CLOSED_SEGMENTS_SINKS` mode
+ - Expression processing configuration `druid.expressions.allowNestedArrays`
diff --git a/docs/development/extensions-core/datasketches-tuple.md b/docs/development/extensions-core/datasketches-tuple.md
index fc4f74d5c81d..c9a05b5ab197 100644
--- a/docs/development/extensions-core/datasketches-tuple.md
+++ b/docs/development/extensions-core/datasketches-tuple.md
@@ -39,19 +39,52 @@ druid.extensions.loadList=["druid-datasketches"]
"name" : ,
"fieldName" : ,
"nominalEntries": ,
- "numberOfValues" : ,
- "metricColumns" :
+ "metricColumns" : ,
+ "numberOfValues" :
}
```
|property|description|required?|
|--------|-----------|---------|
|type|This String should always be "arrayOfDoublesSketch"|yes|
-|name|A String for the output (result) name of the calculation.|yes|
+|name|String representing the output column to store sketch values.|yes|
|fieldName|A String for the name of the input field.|yes|
|nominalEntries|Parameter that determines the accuracy and size of the sketch. Higher k means higher accuracy but more space to store sketches. Must be a power of 2. See the [Theta sketch accuracy](https://datasketches.apache.org/docs/Theta/ThetaErrorTable) for details. |no, defaults to 16384|
-|numberOfValues|Number of values associated with each distinct key. |no, defaults to 1|
-|metricColumns|If building sketches from raw data, an array of names of the input columns containing numeric values to be associated with each distinct key.|no, defaults to empty array|
+|metricColumns|When building sketches from raw data, an array of input columns that contain numeric values to associate with each distinct key.|no, if not provided `fieldName` is assumed to be an `arrayOfDoublesSketch`|
+|numberOfValues|Number of values associated with each distinct key.|no, defaults to the length of `metricColumns` if provided, and 1 otherwise|
+
+You can use the `arrayOfDoublesSketch` aggregator to:
+
+- Build a sketch from raw data. In this case, set `metricColumns` to an array.
+- Build a sketch from an existing `ArrayOfDoubles` sketch. In this case, leave `metricColumns` unset and set `fieldName` to a column containing an `ArrayOfDoubles` sketch with `numberOfValues` doubles. You must base64 encode `ArrayOfDoubles` sketches at ingestion time.
+
+#### Example on top of raw data
+
+Compute a theta sketch of unique users. For each user, store the `added` and `deleted` scores. The new sketch column will be called `users_theta`.
+
+```json
+{
+ "type": "arrayOfDoublesSketch",
+ "name": "users_theta",
+ "fieldName": "user",
+ "nominalEntries": 16384,
+ "metricColumns": ["added", "deleted"],
+}
+```
+
+#### Example ingesting a precomputed sketch column
+
+Ingest a sketch column called `user_sketches`, where each value is a base64 encoded `ArrayOfDoubles` sketch containing two doubles, and store it in a column called `users_theta`.
+
+```json
+{
+ "type": "arrayOfDoublesSketch",
+ "name": "users_theta",
+ "fieldName": "user_sketches",
+ "nominalEntries": 16384,
+ "numberOfValues": 2,
+}
+```
### Post Aggregators
diff --git a/docs/development/extensions-core/druid-basic-security.md b/docs/development/extensions-core/druid-basic-security.md
index b6698b4f153d..4e042b4405f3 100644
--- a/docs/development/extensions-core/druid-basic-security.md
+++ b/docs/development/extensions-core/druid-basic-security.md
@@ -53,12 +53,29 @@ To set the value for the configuration properties, add them to the common runtim
### General properties
-|Property|Description|Default|required|
-|--------|-----------|-------|--------|
-|`druid.auth.basic.common.pollingPeriod`|Defines in milliseconds how often processes should poll the Coordinator for the current Druid metadata store authenticator/authorizer state.|60000|No|
-|`druid.auth.basic.common.maxRandomDelay`|Defines in milliseconds the amount of random delay to add to the pollingPeriod, to spread polling requests across time.|6000|No|
-|`druid.auth.basic.common.maxSyncRetries`|Determines how many times a service will retry if the authentication/authorization Druid metadata store state sync with the Coordinator fails.|10|No|
-|`druid.auth.basic.common.cacheDirectory`|If defined, snapshots of the basic Authenticator and Authorizer Druid metadata store caches will be stored on disk in this directory. If this property is defined, when a service is starting, it will attempt to initialize its caches from these on-disk snapshots, if the service is unable to initialize its state by communicating with the Coordinator.|null|No|
+**`druid.auth.basic.common.pollingPeriod`**
+
+Defines in milliseconds how often processes should poll the Coordinator for the current Druid metadata store authenticator/authorizer state.
+ **Required**: No
+ **Default**: 60000
+
+**`druid.auth.basic.common.maxRandomDelay`**
+
+Defines in milliseconds the amount of random delay to add to the pollingPeriod, to spread polling requests across time.
+ **Required**: No
+ **Default**: 6000
+
+**`druid.auth.basic.common.maxSyncRetries`**
+
+Determines how many times a service will retry if the authentication/authorization Druid metadata store state sync with the Coordinator fails.
+ **Required**: No
+ **Default**: 10
+
+**`druid.auth.basic.common.cacheDirectory`**
+
+If defined, snapshots of the basic Authenticator and Authorizer Druid metadata store caches will be stored on disk in this directory. If this property is defined, when a service is starting, it will attempt to initialize its caches from these on-disk snapshots, if the service is unable to initialize its state by communicating with the Coordinator.
+ **Required**: No
+ **Default**: null
### Authenticator
@@ -96,16 +113,55 @@ The remaining examples of authenticator configuration use either `MyBasicMetadat
#### Properties for Druid metadata store user authentication
-|Property|Description|Default|required|
-|--------|-----------|-------|--------|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.initialAdminPassword`|Initial [Password Provider](../../operations/password-provider.md) for the automatically created default admin user. If no password is specified, the default admin user will not be created. If the default admin user already exists, setting this property will not affect its password.|null|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.initialInternalClientPassword`|Initial [Password Provider](../../operations/password-provider.md) for the default internal system user, used for internal process communication. If no password is specified, the default internal system user will not be created. If the default internal system user already exists, setting this property will not affect its password.|null|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.enableCacheNotifications`|If true, the Coordinator will notify Druid processes whenever a configuration change to this Authenticator occurs, allowing them to immediately update their state without waiting for polling.|true|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.cacheNotificationTimeout`|The timeout in milliseconds for the cache notifications.|5000|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.credentialIterations`|Number of iterations to use for password hashing. See [Credential iterations and API performance](#credential-iterations-and-api-performance)|10000|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.credentialsValidator.type`|The type of credentials store (metadata) to validate requests credentials.|metadata|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.skipOnFailure`|If true and the request credential doesn't exists or isn't fully configured in the credentials store, the request will proceed to next Authenticator in the chain.|false|No|
-|`druid.auth.authenticator.MyBasicMetadataAuthenticator.authorizerName`|Authorizer that requests should be directed to|N/A|Yes|
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.initialAdminPassword`**
+
+Initial [Password Provider](../../operations/password-provider.md) for the automatically created default admin user. If no password is specified, the default admin user will not be created. If the default admin user already exists, setting this property will not affect its password.
+ **Required**: No
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.initialInternalClientPassword`**
+
+Initial [Password Provider](../../operations/password-provider.md) for the default internal system user, used for internal process communication. If no password is specified, the default internal system user will not be created. If the default internal system user already exists, setting this property will not affect its password.
+ **Required**: No
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.enableCacheNotifications`**
+
+If true, the Coordinator will notify Druid processes whenever a configuration change to this Authenticator occurs, allowing them to immediately update their state without waiting for polling.
+ **Required**: No
+ **Default**: true
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.cacheNotificationTimeout`**
+
+The timeout in milliseconds for the cache notifications.
+ **Required**: No
+ **Default**: 5000
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.credentialIterations`**
+
+Number of iterations to use for password hashing. See [Credential iterations and API performance](#credential-iterations-and-api-performance)
+ **Required**: No
+ **Default**: 10000
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.credentialsValidator.type`**
+
+The type of credentials store (metadata) to validate request credentials.
+ **Required**: No
+ **Default**: metadata
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.skipOnFailure`**
+
+If true and the request credential doesn't exist or isn't fully configured in the credentials store, the request will proceed to the next Authenticator in the chain.
+ **Required**: No
+ **Default**: false
+
+**`druid.auth.authenticator.MyBasicMetadataAuthenticator.authorizerName`**
+
+Authorizer that requests should be directed to.
+ **Required**: Yes
+ **Default**: N/A
+
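+For example, a minimal metadata store authenticator configuration (the authenticator name and password values are illustrative):
+
+```
+druid.auth.authenticator.MyBasicMetadataAuthenticator.type=basic
+druid.auth.authenticator.MyBasicMetadataAuthenticator.initialAdminPassword=password1
+druid.auth.authenticator.MyBasicMetadataAuthenticator.initialInternalClientPassword=password2
+druid.auth.authenticator.MyBasicMetadataAuthenticator.authorizerName=MyBasicMetadataAuthorizer
+```
+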
##### Credential iterations and API performance
@@ -121,25 +177,107 @@ If Druid uses the default credentials validator (i.e., `credentialsValidator.typ
#### Properties for LDAP user authentication
-|Property|Description|Default|required|
-|--------|-----------|-------|--------|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.initialAdminPassword`|Initial [Password Provider](../../operations/password-provider.md) for the automatically created default admin user. If no password is specified, the default admin user will not be created. If the default admin user already exists, setting this property will not affect its password.|null|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.initialInternalClientPassword`|Initial [Password Provider](../../operations/password-provider.md) for the default internal system user, used for internal process communication. If no password is specified, the default internal system user will not be created. If the default internal system user already exists, setting this property will not affect its password.|null|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.enableCacheNotifications`|If true, the Coordinator will notify Druid processes whenever a configuration change to this Authenticator occurs, allowing them to immediately update their state without waiting for polling.|true|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.cacheNotificationTimeout`|The timeout in milliseconds for the cache notifications.|5000|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialIterations`|Number of iterations to use for password hashing.|10000|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.type`|The type of credentials store (ldap) to validate requests credentials.|metadata|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.url`|URL of the LDAP server.|null|Yes|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.bindUser`|LDAP bind user username.|null|Yes|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.bindPassword`|[Password Provider](../../operations/password-provider.md) LDAP bind user password.|null|Yes|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.baseDn`|The point from where the LDAP server will search for users.|null|Yes|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.userSearch`|The filter/expression to use for the search. For example, (&(sAMAccountName=%s)(objectClass=user))|null|Yes|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.userAttribute`|The attribute id identifying the attribute that will be returned as part of the search. For example, sAMAccountName. |null|Yes|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.credentialVerifyDuration`|The duration in seconds for how long valid credentials are verifiable within the cache when not requested.|600|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.credentialMaxDuration`|The max duration in seconds for valid credentials that can reside in cache regardless of how often they are requested.|3600|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.credentialCacheSize`|The valid credentials cache size. The cache uses a LRU policy.|100|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.skipOnFailure`|If true and the request credential doesn't exists or isn't fully configured in the credentials store, the request will proceed to next Authenticator in the chain.|false|No|
-|`druid.auth.authenticator.MyBasicLDAPAuthenticator.authorizerName`|Authorizer that requests should be directed to.|N/A|Yes|
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.initialAdminPassword`**
+
+Initial [Password Provider](../../operations/password-provider.md) for the automatically created default admin user. If no password is specified, the default admin user will not be created. If the default admin user already exists, setting this property will not affect its password.
+ **Required**: No
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.initialInternalClientPassword`**
+
+Initial [Password Provider](../../operations/password-provider.md) for the default internal system user, used for internal process communication. If no password is specified, the default internal system user will not be created. If the default internal system user already exists, setting this property will not affect its password.
+ **Required**: No
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.enableCacheNotifications`**
+
+If true, the Coordinator will notify Druid processes whenever a configuration change to this Authenticator occurs, allowing them to immediately update their state without waiting for polling.
+ **Required**: No
+ **Default**: true
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.cacheNotificationTimeout`**
+
+The timeout in milliseconds for the cache notifications.
+ **Required**: No
+ **Default**: 5000
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialIterations`**
+
+Number of iterations to use for password hashing.
+ **Required**: No
+ **Default**: 10000
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.type`**
+
+The type of credentials store (ldap) to validate request credentials.
+ **Required**: No
+ **Default**: metadata
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.url`**
+
+URL of the LDAP server.
+ **Required**: Yes
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.bindUser`**
+
+LDAP bind user username.
+ **Required**: Yes
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.bindPassword`**
+
+[Password Provider](../../operations/password-provider.md) LDAP bind user password.
+ **Required**: Yes
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.baseDn`**
+
+The point from where the LDAP server will search for users.
+ **Required**: Yes
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.userSearch`**
+
+The filter/expression to use for the search. For example, `(&(sAMAccountName=%s)(objectClass=user))`.
+ **Required**: Yes
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.userAttribute`**
+
+The attribute id identifying the attribute that will be returned as part of the search. For example, `sAMAccountName`.
+ **Required**: Yes
+ **Default**: null
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.credentialVerifyDuration`**
+
+The duration in seconds for how long valid credentials are verifiable within the cache when not requested.
+ **Required**: No
+ **Default**: 600
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.credentialMaxDuration`**
+
+The max duration in seconds for valid credentials that can reside in cache regardless of how often they are requested.
+ **Required**: No
+ **Default**: 3600
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.credentialCacheSize`**
+
+The valid credentials cache size. The cache uses an LRU policy.
+ **Required**: No
+ **Default**: 100
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.skipOnFailure`**
+
+If true and the request credential doesn't exist or isn't fully configured in the credentials store, the request will proceed to the next Authenticator in the chain.
+ **Required**: No
+ **Default**: false
+
+**`druid.auth.authenticator.MyBasicLDAPAuthenticator.authorizerName`**
+
+Authorizer that requests should be directed to.
+ **Required**: Yes
+ **Default**: N/A
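+
+For example, a minimal LDAP authenticator configuration (the server URL, bind user, and search values are illustrative):
+
+```
+druid.auth.authenticator.MyBasicLDAPAuthenticator.type=basic
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.type=ldap
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.url=ldap://ad_host:389
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.bindUser=ad_admin_user
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.bindPassword=ad_admin_password
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.baseDn=dc=example,dc=com
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.userSearch=(&(sAMAccountName=%s)(objectClass=user))
+druid.auth.authenticator.MyBasicLDAPAuthenticator.credentialsValidator.userAttribute=sAMAccountName
+druid.auth.authenticator.MyBasicLDAPAuthenticator.authorizerName=MyBasicLDAPAuthorizer
+```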
### Escalator
@@ -155,11 +293,24 @@ druid.escalator.authorizerName=MyBasicMetadataAuthorizer
```
#### Properties
-|Property|Description|Default|required|
-|--------|-----------|-------|--------|
-|`druid.escalator.internalClientUsername`|The escalator will use this username for requests made as the internal system user.|n/a|Yes|
-|`druid.escalator.internalClientPassword`|The escalator will use this [Password Provider](../../operations/password-provider.md) for requests made as the internal system user.|n/a|Yes|
-|`druid.escalator.authorizerName`|Authorizer that requests should be directed to.|n/a|Yes|
+
+**`druid.escalator.internalClientUsername`**
+
+The escalator will use this username for requests made as the internal system user.
+ **Required**: Yes
+ **Default**: N/A
+
+**`druid.escalator.internalClientPassword`**
+
+The escalator will use this [Password Provider](../../operations/password-provider.md) for requests made as the internal system user.
+ **Required**: Yes
+ **Default**: N/A
+
+**`druid.escalator.authorizerName`**
+
+Authorizer that requests should be directed to.
+ **Required**: Yes
+ **Default**: N/A
### Authorizer
@@ -182,24 +333,131 @@ druid.auth.authorizer.MyBasicMetadataAuthorizer.type=basic
The examples in the rest of this article use `MyBasicMetadataAuthorizer` or `MyBasicLDAPAuthorizer` as the authorizer name.
#### Properties for Druid metadata store user authorization
-|Property|Description|Default|required|
-|--------|-----------|-------|--------|
-|`druid.auth.authorizer.MyBasicMetadataAuthorizer.enableCacheNotifications`|If true, the Coordinator will notify Druid processes whenever a configuration change to this Authorizer occurs, allowing them to immediately update their state without waiting for polling.|true|No|
-|`druid.auth.authorizer.MyBasicMetadataAuthorizer.cacheNotificationTimeout`|The timeout in milliseconds for the cache notifications.|5000|No|
-|`druid.auth.authorizer.MyBasicMetadataAuthorizer.initialAdminUser`|The initial admin user with role defined in initialAdminRole property if specified, otherwise the default admin role will be assigned.|admin|No|
-|`druid.auth.authorizer.MyBasicMetadataAuthorizer.initialAdminRole`|The initial admin role to create if it doesn't already exists.|admin|No|
-|`druid.auth.authorizer.MyBasicMetadataAuthorizer.roleProvider.type`|The type of role provider to authorize requests credentials.|metadata|No
+
+**`druid.auth.authorizer.MyBasicMetadataAuthorizer.enableCacheNotifications`**
+
+If true, the Coordinator will notify Druid processes whenever a configuration change to this Authorizer occurs, allowing them to immediately update their state without waiting for polling.
+ **Required**: No
+ **Default**: true
+
+**`druid.auth.authorizer.MyBasicMetadataAuthorizer.cacheNotificationTimeout`**
+
+The timeout in milliseconds for the cache notifications.
+ **Required**: No
+ **Default**: 5000
+
+**`druid.auth.authorizer.MyBasicMetadataAuthorizer.initialAdminUser`**
+
+The initial admin user. If the `initialAdminRole` property is specified, Druid assigns that role to this user; otherwise it assigns the default admin role.
+ **Required**: No
+ **Default**: admin
+
+**`druid.auth.authorizer.MyBasicMetadataAuthorizer.initialAdminRole`**
+
+The initial admin role to create if it doesn't already exist.
+ **Required**: No
+ **Default**: admin
+
+**`druid.auth.authorizer.MyBasicMetadataAuthorizer.roleProvider.type`**
+
+The type of role provider used to authorize request credentials.
+ **Required**: No
+ **Default**: metadata
#### Properties for LDAP user authorization
-|Property|Description|Default|required|
-|--------|-----------|-------|--------|
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.enableCacheNotifications`|If true, the Coordinator will notify Druid processes whenever a configuration change to this Authorizer occurs, allowing them to immediately update their state without waiting for polling.|true|No|
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.cacheNotificationTimeout`|The timeout in milliseconds for the cache notifications.|5000|No|
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.initialAdminUser`|The initial admin user with role defined in initialAdminRole property if specified, otherwise the default admin role will be assigned.|admin|No|
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.initialAdminRole`|The initial admin role to create if it doesn't already exists.|admin|No|
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.initialAdminGroupMapping`|The initial admin group mapping with role defined in initialAdminRole property if specified, otherwise the default admin role will be assigned. The name of this initial admin group mapping will be set to adminGroupMapping|null|No|
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.roleProvider.type`|The type of role provider (ldap) to authorize requests credentials.|metadata|No
-|`druid.auth.authorizer.MyBasicLDAPAuthorizer.roleProvider.groupFilters`|Array of LDAP group filters used to filter out the allowed set of groups returned from LDAP search. Filters can be begin with *, or end with ,* to provide configurational flexibility to limit or filter allowed set of groups available to LDAP Authorizer.|null|No|
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.enableCacheNotifications`**
+
+If true, the Coordinator will notify Druid processes whenever a configuration change to this Authorizer occurs, allowing them to immediately update their state without waiting for polling.
+ **Required**: No
+ **Default**: true
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.cacheNotificationTimeout`**
+
+The timeout in milliseconds for the cache notifications.
+ **Required**: No
+ **Default**: 5000
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.initialAdminUser`**
+
+The initial admin user. If the `initialAdminRole` property is specified, Druid assigns that role to this user; otherwise it assigns the default admin role.
+ **Required**: No
+ **Default**: admin
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.initialAdminRole`**
+
+The initial admin role to create if it doesn't already exist.
+ **Required**: No
+ **Default**: admin
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.initialAdminGroupMapping`**
+
+The initial admin group mapping. If the `initialAdminRole` property is specified, Druid assigns that role to this group mapping; otherwise it assigns the default admin role. The name of this initial admin group mapping is set to `adminGroupMapping`.
+ **Required**: No
+ **Default**: null
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.roleProvider.type`**
+
+The type of role provider (`ldap`) used to authorize request credentials.
+ **Required**: No
+ **Default**: metadata
+
+**`druid.auth.authorizer.MyBasicLDAPAuthorizer.roleProvider.groupFilters`**
+
+Array of LDAP group filters used to filter the allowed set of groups returned from the LDAP search. Filters can begin with `*,` or end with `,*` to provide flexibility in limiting or filtering the set of groups available to the LDAP Authorizer.
+ **Required**: No
+ **Default**: null
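+
+For example, the following sketch (with placeholder group DNs) limits the authorizer to groups under one organizational unit, plus one explicitly named group:
+
+```properties
+druid.auth.authorizer.MyBasicLDAPAuthorizer.roleProvider.type=ldap
+druid.auth.authorizer.MyBasicLDAPAuthorizer.roleProvider.groupFilters=["*,ou=Groups,dc=example,dc=com", "cn=druid-admins,*"]
+```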
+
+#### Properties for LDAPS
+
+Use the following properties to configure Druid authentication with LDAP over TLS (LDAPS). See [Configure LDAP authentication](../../operations/auth-ldap.md) for more information.
+
+**`druid.auth.basic.ssl.protocol`**
+
+SSL protocol to use. Druid uses TLS version 1.2.
+ **Required**: Yes
+ **Default**: tls
+
+**`druid.auth.basic.ssl.trustStorePath`**
+
+Path to the trust store file.
+ **Required**: Yes
+ **Default**: N/A
+
+**`druid.auth.basic.ssl.trustStorePassword`**
+
+Password to access the trust store file.
+ **Required**: Yes
+ **Default**: N/A
+
+**`druid.auth.basic.ssl.trustStoreType`**
+
+Format of the trust store file. For Java, the format is `jks`.
+ **Required**: No
+ **Default**: jks
+
+**`druid.auth.basic.ssl.trustStoreAlgorithm`**
+
+Algorithm used by the trust manager to validate certificate chains.
+ **Required**: No
+ **Default**: N/A
+
+Example LDAPS configuration:
+
+```properties
+druid.auth.basic.ssl.protocol=tls
+druid.auth.basic.ssl.trustStorePath=/usr/local/druid-path/certs/truststore.jks
+druid.auth.basic.ssl.trustStorePassword=xxxxx
+druid.auth.basic.ssl.trustStoreType=jks
+druid.auth.basic.ssl.trustStoreAlgorithm=PKIX
+```
+You can configure `druid.auth.basic.ssl.trustStorePassword` to be a plain text password or you can set the password as an environment variable. See [Password providers](../../operations/password-provider.md) for more information.
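+
+For example, to read the trust store password from an environment variable, you might use the environment variable [Password Provider](../../operations/password-provider.md); the variable name below is a placeholder:
+
+```properties
+druid.auth.basic.ssl.trustStorePassword={"type":"environment","variable":"DRUID_TRUSTSTORE_PASSWORD"}
+```
+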
## Usage
@@ -213,19 +471,19 @@ Root path: `/druid-ext/basic-security/authentication`
Each API endpoint includes {authenticatorName}, specifying which Authenticator instance is being configured.
##### User/Credential Management
-`GET(/druid-ext/basic-security/authentication/db/{authenticatorName}/users)`
+`GET(/druid-ext/basic-security/authentication/db/{authenticatorName}/users)`
Return a list of all user names.
-`GET(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName})`
+`GET(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName})`
Return the name and credentials information of the user with name {userName}
-`POST(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName})`
+`POST(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName})`
Create a new user with name {userName}
-`DELETE(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName})`
+`DELETE(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName})`
Delete the user with name {userName}
-`POST(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName}/credentials)`
+`POST(/druid-ext/basic-security/authentication/db/{authenticatorName}/users/{userName}/credentials)`
Assign a password used for HTTP basic authentication for {userName}
Content: JSON password request object
@@ -238,20 +496,20 @@ Example request body:
```
##### Cache Load Status
-`GET(/druid-ext/basic-security/authentication/loadStatus)`
+`GET(/druid-ext/basic-security/authentication/loadStatus)`
Return the current load status of the local caches of the authentication Druid metadata store.
#### Authorization API
-Root path: `/druid-ext/basic-security/authorization`
+Root path: `/druid-ext/basic-security/authorization`
Each API endpoint includes {authorizerName}, specifying which Authorizer instance is being configured.
##### User Creation/Deletion
-`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/users)`
+`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/users)`
Return a list of all user names.
-`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName})`
+`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName})`
Return the name and role information of the user with name {userName}
Example output:
@@ -338,20 +596,20 @@ The `resourceNamePattern` is a compiled version of the resource name regex. It i
}
```
-`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName})`
+`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName})`
Create a new user with name {userName}
-`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName})`
+`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName})`
Delete the user with name {userName}
##### Group mapping Creation/Deletion
-`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings)`
+`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings)`
Return a list of all group mappings.
-`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName})`
+`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName})`
Return the group mapping and role information of the group mapping with name {groupMappingName}
-`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName})`
+`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName})`
Create a new group mapping with name {groupMappingName}
Content: JSON group mapping object
Example request body:
@@ -366,14 +624,14 @@ Example request body:
}
```
-`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName})`
+`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName})`
Delete the group mapping with name {groupMappingName}
#### Role Creation/Deletion
-`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/roles)`
+`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/roles)`
Return a list of all role names.
-`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName})`
+`GET(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName})`
Return name and permissions for the role named {roleName}.
Example output:
@@ -427,30 +685,30 @@ Example output:
```
-`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName})`
+`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName})`
Create a new role with name {roleName}.
Content: username string
-`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName})`
+`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName})`
Delete the role with name {roleName}.
#### Role Assignment
-`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName}/roles/{roleName})`
+`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName}/roles/{roleName})`
Assign role {roleName} to user {userName}.
-`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName}/roles/{roleName})`
+`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/users/{userName}/roles/{roleName})`
Unassign role {roleName} from user {userName}
-`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName}/roles/{roleName})`
+`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName}/roles/{roleName})`
Assign role {roleName} to group mapping {groupMappingName}.
-`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName}/roles/{roleName})`
+`DELETE(/druid-ext/basic-security/authorization/db/{authorizerName}/groupMappings/{groupMappingName}/roles/{roleName})`
Unassign role {roleName} from group mapping {groupMappingName}
#### Permissions
-`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName}/permissions)`
+`POST(/druid-ext/basic-security/authorization/db/{authorizerName}/roles/{roleName}/permissions)`
Set the permissions of {roleName}. This replaces the previous set of permissions on the role.
Content: List of JSON Resource-Action objects, e.g.:
@@ -479,5 +737,5 @@ The "name" field for resources in the permission definitions are regexes used to
Please see [Defining permissions](../../operations/security-user-auth.md#defining-permissions) for more details.
##### Cache Load Status
-`GET(/druid-ext/basic-security/authorization/loadStatus)`
+`GET(/druid-ext/basic-security/authorization/loadStatus)`
Return the current load status of the local caches of the authorization Druid metadata store.
diff --git a/docs/development/extensions-core/druid-lookups.md b/docs/development/extensions-core/druid-lookups.md
index b44f9620bd0a..5b19508c2375 100644
--- a/docs/development/extensions-core/druid-lookups.md
+++ b/docs/development/extensions-core/druid-lookups.md
@@ -22,9 +22,6 @@ title: "Cached Lookup Module"
~ under the License.
-->
-
-> Please note that this is an experimental module and the development/testing still at early stage. Feel free to try it and give us your feedback.
-
## Description
This Apache Druid module provides a per-lookup caching mechanism for JDBC data sources.
The main goal of this cache is to speed up access to high-latency lookup sources and to provide caching isolation for every lookup source.
diff --git a/docs/development/extensions-core/kafka-supervisor-reference.md b/docs/development/extensions-core/kafka-supervisor-reference.md
index 210207302f2d..360e75a83de4 100644
--- a/docs/development/extensions-core/kafka-supervisor-reference.md
+++ b/docs/development/extensions-core/kafka-supervisor-reference.md
@@ -56,8 +56,6 @@ This topic contains configuration reference information for the Apache Kafka sup
## Task Autoscaler Properties
-> Note that Task AutoScaler is currently designated as experimental.
-
| Property | Description | Required |
| ------------- | ------------- | ------------- |
| `enableTaskAutoScaler` | Enable or disable autoscaling. `false` or blank disables the `autoScaler` even when `autoScalerConfig` is not null| no (default == false) |
@@ -206,8 +204,8 @@ The `tuningConfig` is optional and default parameters will be used if no `tuning
| `handoffConditionTimeout` | Long | Milliseconds to wait for segment handoff. It must be >= 0, where 0 means to wait forever. | no (default == 0) |
| `resetOffsetAutomatically` | Boolean | Controls behavior when Druid needs to read Kafka messages that are no longer available (i.e. when `OffsetOutOfRangeException` is encountered). If false, the exception will bubble up, which will cause your tasks to fail and ingestion to halt. If this occurs, manual intervention is required to correct the situation; potentially using the [Reset Supervisor API](../../operations/api-reference.md#supervisors). This mode is useful for production, since it will make you aware of issues with ingestion. If true, Druid will automatically reset to the earlier or latest offset available in Kafka, based on the value of the `useEarliestOffset` property (earliest if true, latest if false). Note that this can lead to data being _DROPPED_ (if `useEarliestOffset` is false) or _DUPLICATED_ (if `useEarliestOffset` is true) without your knowledge. Messages will be logged indicating that a reset has occurred, but ingestion will continue. This mode is useful for non-production situations, since it will make Druid attempt to recover from problems automatically, even if they lead to quiet dropping or duplicating of data. This feature behaves similarly to the Kafka `auto.offset.reset` consumer property. | no (default == false) |
| `workerThreads` | Integer | The number of threads that the supervisor uses to handle requests/responses for worker tasks, along with any other internal asynchronous operation. | no (default == min(10, taskCount)) |
-| `chatAsync` | Boolean | If true, use asynchronous communication with indexing tasks, and ignore the `chatThreads` parameter. If false, use synchronous communication in a thread pool of size `chatThreads`. | no (default == false) |
-| `chatThreads` | Integer | The number of threads that will be used for communicating with indexing tasks. Ignored if `chatAsync` is `true`. | no (default == min(10, taskCount * replicas)) |
+| `chatAsync` | Boolean | If true, use asynchronous communication with indexing tasks, and ignore the `chatThreads` parameter. If false, use synchronous communication in a thread pool of size `chatThreads`. | no (default == true) |
+| `chatThreads` | Integer | The number of threads that will be used for communicating with indexing tasks. Ignored if `chatAsync` is `true` (the default). | no (default == min(10, taskCount * replicas)) |
| `chatRetries` | Integer | The number of times HTTP requests to indexing tasks will be retried before considering tasks unresponsive. | no (default == 8) |
| `httpTimeout` | ISO8601 Period | How long to wait for a HTTP response from an indexing task. | no (default == PT10S) |
| `shutdownTimeout` | ISO8601 Period | How long to wait for the supervisor to attempt a graceful shutdown of tasks before exiting. | no (default == PT80S) |
diff --git a/docs/development/extensions-core/kinesis-ingestion.md b/docs/development/extensions-core/kinesis-ingestion.md
index 84036665ec9e..9b14ec767c26 100644
--- a/docs/development/extensions-core/kinesis-ingestion.md
+++ b/docs/development/extensions-core/kinesis-ingestion.md
@@ -149,8 +149,6 @@ Where the file `supervisor-spec.json` contains a Kinesis supervisor spec:
#### Task Autoscaler Properties
-> Note that Task AutoScaler is currently designated as experimental.
-
| Property | Description | Required |
| ------------- | ------------- | ------------- |
| `enableTaskAutoScaler` | Enable or disable the auto scaler. When false or absent, Druid disables the `autoScaler` even when `autoScalerConfig` is not null.| no (default == false) |
@@ -293,8 +291,8 @@ The `tuningConfig` is optional. If no `tuningConfig` is specified, default param
|`resetOffsetAutomatically`|Boolean|Controls behavior when Druid needs to read Kinesis messages that are no longer available. If false, the exception will bubble up, which will cause your tasks to fail and ingestion to halt. If this occurs, manual intervention is required to correct the situation; potentially using the [Reset Supervisor API](../../operations/api-reference.md#supervisors). This mode is useful for production, since it will make you aware of issues with ingestion. If true, Druid will automatically reset to the earlier or latest sequence number available in Kinesis, based on the value of the `useEarliestSequenceNumber` property (earliest if true, latest if false). Please note that this can lead to data being _DROPPED_ (if `useEarliestSequenceNumber` is false) or _DUPLICATED_ (if `useEarliestSequenceNumber` is true) without your knowledge. Messages will be logged indicating that a reset has occurred, but ingestion will continue. This mode is useful for non-production situations, since it will make Druid attempt to recover from problems automatically, even if they lead to quiet dropping or duplicating of data.|no (default == false)|
|`skipSequenceNumberAvailabilityCheck`|Boolean|Whether to enable checking if the current sequence number is still available in a particular Kinesis shard. If set to false, the indexing task will attempt to reset the current sequence number (or not), depending on the value of `resetOffsetAutomatically`.|no (default == false)|
|`workerThreads`|Integer|The number of threads that the supervisor uses to handle requests/responses for worker tasks, along with any other internal asynchronous operation.|no (default == min(10, taskCount))|
-|`chatAsync`|Boolean| If true, use asynchronous communication with indexing tasks, and ignore the `chatThreads` parameter. If false, use synchronous communication in a thread pool of size `chatThreads`. | no (default == false) |
-|`chatThreads`|Integer| The number of threads that will be used for communicating with indexing tasks. Ignored if `chatAsync` is `true`.| no (default == min(10, taskCount * replicas))|
+|`chatAsync`|Boolean| If true, use asynchronous communication with indexing tasks, and ignore the `chatThreads` parameter. If false, use synchronous communication in a thread pool of size `chatThreads`. | no (default == true) |
+|`chatThreads`|Integer| The number of threads that will be used for communicating with indexing tasks. Ignored if `chatAsync` is `true` (the default).| no (default == min(10, taskCount * replicas))|
|`chatRetries`|Integer|The number of times HTTP requests to indexing tasks will be retried before considering tasks unresponsive.| no (default == 8)|
|`httpTimeout`|ISO8601 Period|How long to wait for a HTTP response from an indexing task.|no (default == PT10S)|
|`shutdownTimeout`|ISO8601 Period|How long to wait for the supervisor to attempt a graceful shutdown of tasks before exiting.|no (default == PT80S)|
diff --git a/docs/ingestion/data-formats.md b/docs/ingestion/data-formats.md
index eb08df0cf7a8..557060a5e663 100644
--- a/docs/ingestion/data-formats.md
+++ b/docs/ingestion/data-formats.md
@@ -606,9 +606,9 @@ For example:
### FlattenSpec
-The `flattenSpec` object bridges the gap between potentially nested input data, such as Avro or ORC, and Druid's flat data model. It is an object within the `inputFormat` object.
+You can use the `flattenSpec` object to flatten nested data, as an alternative to the Druid [nested columns](../querying/nested-columns.md) feature, or for nested input formats that the feature doesn't support. It is an object within the `inputFormat` object.
-> If you have nested JSON data, you can ingest and store JSON in an Apache Druid column as a `COMPLEX` data type. See [Nested columns](../querying/nested-columns.md) for more information.
+See [Nested columns](../querying/nested-columns.md) for information on ingesting and storing nested data in an Apache Druid column as a `COMPLEX` data type.
Configure your `flattenSpec` as follows:
diff --git a/docs/ingestion/migrate-from-firehose-ingestion.md b/docs/ingestion/migrate-from-firehose-ingestion.md
new file mode 100644
index 000000000000..c5d3f6946f21
--- /dev/null
+++ b/docs/ingestion/migrate-from-firehose-ingestion.md
@@ -0,0 +1,209 @@
+---
+id: migrate-from-firehose
+title: "Migrate from firehose to input source ingestion"
+sidebar_label: "Migrate from firehose"
+---
+
+
+
+Apache Druid deprecated firehose support in version 0.17. Support for firehose ingestion will be removed in version 26.0.
+
+If you're using a firehose for batch ingestion, we strongly recommend that you follow the instructions on this page to transition to using native batch ingestion input sources as soon as possible.
+
+Firehose ingestion doesn't work with newer Druid versions, so you must be using an ingestion spec with a defined input source before you upgrade.
+
+## Migrate from firehose ingestion to an input source
+
+To migrate from firehose ingestion, you can use the Druid console to update your ingestion spec, or you can update it manually.
+
+### Use the Druid console
+
+To update your ingestion spec using the Druid console, open the console and copy your spec into the **Edit spec** stage of the data loader.
+
+Druid converts the spec into one with a defined input source. For example, it converts the [example firehose ingestion spec](#example-firehose-ingestion-spec) below into the [example ingestion spec after migration](#example-ingestion-spec-after-migration).
+
+If you're unable to use the console or you have problems with the console method, the alternative is to update your ingestion spec manually.
+
+### Update your ingestion spec manually
+
+To update your ingestion spec manually, copy your existing spec into a new file. Refer to [Native batch ingestion with firehose (Deprecated)](./native-batch-firehose.md) for a description of firehose properties.
+
+Edit the new file as follows:
+
+1. In the `ioConfig` component, replace the `firehose` definition with an `inputSource` definition for your chosen input source. See [Native batch input sources](./native-batch-input-source.md) for details.
+2. Move the `timestampSpec` definition from `parser.parseSpec` to the `dataSchema` component.
+3. Move the `dimensionsSpec` definition from `parser.parseSpec` to the `dataSchema` component.
+4. Move the `format` definition from `parser.parseSpec` to an `inputFormat` definition in `ioConfig`.
+5. Delete the `parser` definition.
+6. Save the file.
+ You can check the format of your new ingestion file against the [migrated example](#example-ingestion-spec-after-migration) below.
+7. Test the new ingestion spec with a temporary data source.
+8. Once you've successfully ingested sample data with the new spec, stop firehose ingestion and switch to the new spec.
+
+When the transition is complete, you can upgrade Druid to the latest version. See the [Druid release notes](https://druid.apache.org/downloads.html) for upgrade instructions.
+
+### Example firehose ingestion spec
+
+An example firehose ingestion spec is as follows:
+
+```json
+{
+ "type" : "index",
+ "spec" : {
+ "dataSchema" : {
+ "dataSource" : "wikipedia",
+ "metricsSpec" : [
+ {
+ "type" : "count",
+ "name" : "count"
+ },
+ {
+ "type" : "doubleSum",
+ "name" : "added",
+ "fieldName" : "added"
+ },
+ {
+ "type" : "doubleSum",
+ "name" : "deleted",
+ "fieldName" : "deleted"
+ },
+ {
+ "type" : "doubleSum",
+ "name" : "delta",
+ "fieldName" : "delta"
+ }
+ ],
+ "granularitySpec" : {
+ "type" : "uniform",
+ "segmentGranularity" : "DAY",
+ "queryGranularity" : "NONE",
+ "intervals" : [ "2013-08-31/2013-09-01" ]
+ },
+ "parser": {
+ "type": "string",
+ "parseSpec": {
+ "format": "json",
+ "timestampSpec" : {
+ "column" : "timestamp",
+ "format" : "auto"
+ },
+ "dimensionsSpec" : {
+ "dimensions": ["country", "page","language","user","unpatrolled","newPage","robot","anonymous","namespace","continent","region","city"],
+ "dimensionExclusions" : []
+ }
+ }
+ }
+ },
+ "ioConfig" : {
+ "type" : "index",
+ "firehose" : {
+ "type" : "local",
+ "baseDir" : "examples/indexing/",
+ "filter" : "wikipedia_data.json"
+ }
+ },
+ "tuningConfig" : {
+ "type" : "index",
+ "partitionsSpec": {
+ "type": "single_dim",
+ "partitionDimension": "country",
+ "targetRowsPerSegment": 5000000
+ }
+ }
+ }
+}
+```
+
+### Example ingestion spec after migration
+
+The following example illustrates the result of migrating the [example firehose ingestion spec](#example-firehose-ingestion-spec) to a spec with an input source:
+
+```json
+{
+ "type" : "index",
+ "spec" : {
+ "dataSchema" : {
+ "dataSource" : "wikipedia",
+ "timestampSpec" : {
+ "column" : "timestamp",
+ "format" : "auto"
+ },
+ "dimensionsSpec" : {
+ "dimensions": ["country", "page","language","user","unpatrolled","newPage","robot","anonymous","namespace","continent","region","city"],
+ "dimensionExclusions" : []
+ },
+ "metricsSpec" : [
+ {
+ "type" : "count",
+ "name" : "count"
+ },
+ {
+ "type" : "doubleSum",
+ "name" : "added",
+ "fieldName" : "added"
+ },
+ {
+ "type" : "doubleSum",
+ "name" : "deleted",
+ "fieldName" : "deleted"
+ },
+ {
+ "type" : "doubleSum",
+ "name" : "delta",
+ "fieldName" : "delta"
+ }
+ ],
+ "granularitySpec" : {
+ "type" : "uniform",
+ "segmentGranularity" : "DAY",
+ "queryGranularity" : "NONE",
+ "intervals" : [ "2013-08-31/2013-09-01" ]
+ }
+ },
+ "ioConfig" : {
+ "type" : "index",
+ "inputSource" : {
+ "type" : "local",
+ "baseDir" : "examples/indexing/",
+ "filter" : "wikipedia_data.json"
+ },
+ "inputFormat": {
+ "type": "json"
+ }
+ },
+ "tuningConfig" : {
+ "type" : "index",
+ "partitionsSpec": {
+ "type": "single_dim",
+ "partitionDimension": "country",
+ "targetRowsPerSegment": 5000000
+ }
+ }
+ }
+}
+```
+
+## Learn more
+
+For more information, see the following pages:
+
+- [Ingestion](./index.md): Overview of the Druid ingestion process.
+- [Native batch ingestion](./native-batch.md): Description of the supported native batch indexing tasks.
+- [Ingestion spec reference](./ingestion-spec.md): Description of the components and properties in the ingestion spec.
diff --git a/docs/ingestion/native-batch-firehose.md b/docs/ingestion/native-batch-firehose.md
index 4e2cad97fc1a..ca848e725c87 100644
--- a/docs/ingestion/native-batch-firehose.md
+++ b/docs/ingestion/native-batch-firehose.md
@@ -1,6 +1,6 @@
---
id: native-batch-firehose
-title: "Native batch ingestion with firehose"
+title: "Native batch ingestion with firehose (Deprecated)"
sidebar_label: "Firehose (deprecated)"
---
@@ -23,14 +23,13 @@ sidebar_label: "Firehose (deprecated)"
~ under the License.
-->
-
-Firehoses are deprecated in 0.17.0. It's highly recommended to use the [Native batch ingestion input sources](./native-batch-input-source.md) instead.
+> Firehose ingestion is deprecated. See [Migrate from firehose to input source ingestion](./migrate-from-firehose-ingestion.md) for instructions on migrating from firehose ingestion to using native batch ingestion input sources.
There are several firehoses readily available in Druid; some are meant as examples, while others can be used directly in a production environment.
## StaticS3Firehose
-> You need to include the [`druid-s3-extensions`](../development/extensions-core/s3.md) as an extension to use the StaticS3Firehose.
+You need to include the [`druid-s3-extensions`](../development/extensions-core/s3.md) as an extension to use the StaticS3Firehose.
This firehose ingests events from a predefined list of S3 objects.
This firehose is _splittable_ and can be used by the [Parallel task](./native-batch.md).
@@ -62,7 +61,7 @@ Note that prefetching or caching isn't that useful in the Parallel task.
## StaticGoogleBlobStoreFirehose
-> You need to include the [`druid-google-extensions`](../development/extensions-core/google.md) as an extension to use the StaticGoogleBlobStoreFirehose.
+You need to include the [`druid-google-extensions`](../development/extensions-core/google.md) as an extension to use the StaticGoogleBlobStoreFirehose.
This firehose ingests events, similar to the StaticS3Firehose, but from a Google Cloud Store.
@@ -112,7 +111,7 @@ Google Blobs:
## HDFSFirehose
-> You need to include the [`druid-hdfs-storage`](../development/extensions-core/hdfs.md) as an extension to use the HDFSFirehose.
+You need to include the [`druid-hdfs-storage`](../development/extensions-core/hdfs.md) as an extension to use the HDFSFirehose.
This firehose ingests events from a predefined list of files from the HDFS storage.
This firehose is _splittable_ and can be used by the [Parallel task](./native-batch.md).
diff --git a/docs/ingestion/native-batch.md b/docs/ingestion/native-batch.md
index 7106a9a000a3..e8d83f34046a 100644
--- a/docs/ingestion/native-batch.md
+++ b/docs/ingestion/native-batch.md
@@ -679,8 +679,7 @@ Returns the task attempt history of the worker task spec of the given id, or HTT
While ingesting data using the parallel task indexing, Druid creates segments from the input data and pushes them. For segment pushing,
the parallel task index supports the following segment pushing modes based upon your type of [rollup](./rollup.md):
-- Bulk pushing mode: Used for perfect rollup. Druid pushes every segment at the very end of the index task. Until then, Druid stores created segments in memory and local storage of the service running the index task. This mode can cause problems if you have limited storage capacity, and is not recommended to use in production.
-To enable bulk pushing mode, set `forceGuaranteedRollup` in your TuningConfig. You cannot use bulk pushing with `appendToExisting` in your IOConfig.
+- Bulk pushing mode: Used for perfect rollup. Druid pushes every segment at the very end of the index task. Until then, Druid stores created segments in memory and local storage of the service running the index task. To enable bulk pushing mode, set `forceGuaranteedRollup` to `true` in your tuning config; a sketch of such a tuning config follows this list. You cannot use bulk pushing with `appendToExisting` in your IOConfig.
- Incremental pushing mode: Used for best-effort rollup. Druid pushes segments incrementally during the course of the indexing task. The index task collects data and stores created segments in the memory and disks of the services running the task until the total number of collected rows exceeds `maxTotalRows`. At that point the index task immediately pushes all segments created up until that moment, cleans up pushed segments, and continues to ingest the remaining data.
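+
+The following is a sketch of a parallel task tuning config that enables bulk pushing mode. The hash partitioning and the `numShards` value are illustrative choices, not requirements:
+
+```json
+"tuningConfig": {
+  "type": "index_parallel",
+  "forceGuaranteedRollup": true,
+  "partitionsSpec": {
+    "type": "hashed",
+    "numShards": 4
+  }
+}
+```
+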
## Capacity planning
diff --git a/docs/ingestion/schema-design.md b/docs/ingestion/schema-design.md
index 10e6ea82cd2b..f006e792bc44 100644
--- a/docs/ingestion/schema-design.md
+++ b/docs/ingestion/schema-design.md
@@ -116,14 +116,13 @@ naturally emitted. It is also useful if you want to combine timeseries and non-t
Similar to log aggregation systems, Druid offers inverted indexes for fast searching and filtering. Druid's search
capabilities are generally less developed than these systems, and its analytical capabilities are generally more
developed. The main data modeling differences between Druid and these systems are that when ingesting data into Druid,
-you must be more explicit. Druid columns have types specific upfront and Druid does not, at this time, natively support
-nested data.
+you must be more explicit. Druid columns have types specified upfront.
Tips for modeling log data in Druid:
* If you don't know ahead of time what columns you'll want to ingest, use an empty dimensions list to trigger
[automatic detection of dimension columns](#schema-less-dimensions).
-* If you have nested data, flatten it using a [`flattenSpec`](./ingestion-spec.md#flattenspec).
+* If you have nested data, you can ingest it using the [nested columns](../querying/nested-columns.md) feature or flatten it using a [`flattenSpec`](./ingestion-spec.md#flattenspec).
* Consider enabling [rollup](./rollup.md) if you have mainly analytical use cases for your log data. This will
mean you lose the ability to retrieve individual events from Druid, but you potentially gain substantial compression and
query performance boosts.
@@ -198,9 +197,9 @@ like `MILLIS_TO_TIMESTAMP`, `TIME_FLOOR`, and others. If you're using native Dru
### Nested dimensions
-You can ingest and store nested JSON in a Druid column as a `COMPLEX` data type. See [Nested columns](../querying/nested-columns.md) for more information.
+You can ingest and store nested data in a Druid column as a `COMPLEX` data type. See [Nested columns](../querying/nested-columns.md) for more information.
-If you want to ingest nested data in a format other than JSON—for example Avro, ORC, and Parquet—you must use the `flattenSpec` object to flatten it. For example, if you have data of the following form:
+If you want to ingest nested data in a format unsupported by the nested columns feature, you must use the `flattenSpec` object to flatten it. For example, if you have data of the following form:
```json
{ "foo": { "bar": 3 } }
diff --git a/docs/ingestion/tasks.md b/docs/ingestion/tasks.md
index c8a2e915d472..5afbadb3d43a 100644
--- a/docs/ingestion/tasks.md
+++ b/docs/ingestion/tasks.md
@@ -343,6 +343,26 @@ You can override the task priority by setting your priority in the task context
"priority" : 100
}
```
+
+
+## Task actions
+
+Task actions are overlord actions performed by tasks during their lifecycle. Some typical task actions are:
+- `lockAcquire`: acquires a time-chunk lock on an interval for the task
+- `lockRelease`: releases a lock acquired by the task on an interval
+- `segmentTransactionalInsert`: publishes new segments created by a task and optionally overwrites and/or drops existing segments in a single transaction
+- `segmentAllocate`: allocates pending segments to a task to write rows
+
+### Batching `segmentAllocate` actions
+
+In a cluster with several concurrent tasks, `segmentAllocate` actions on the overlord can take a long time to finish, causing spikes in the `task/action/run/time` metric. This can result in ingestion lag building up while a task waits for a segment to be allocated.
+The root cause of such spikes is likely to be one or more of the following:
+- several concurrent tasks trying to allocate segments for the same datasource and interval
+- a large number of metadata calls made to the segments and pending segments tables
+- concurrency limitations while acquiring a task lock required for allocating a segment
+
+Since the contention typically arises from tasks allocating segments for the same datasource and interval, you can improve the run times by batching the actions together.
+To enable batched segment allocation on the overlord, set `druid.indexer.tasklock.batchSegmentAllocation` to `true`. See [overlord configuration](../configuration/index.md#overlord-operations) for more details.
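+
+For example, in the Overlord runtime properties (the wait-time property below is an assumption for illustration; check the configuration reference for your Druid version):
+
+```properties
+druid.indexer.tasklock.batchSegmentAllocation=true
+# Assumed optional setting: how long, in milliseconds, the Overlord waits to batch up allocation requests.
+druid.indexer.tasklock.batchAllocationWaitTime=500
+```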
diff --git a/docs/multi-stage-query/concepts.md b/docs/multi-stage-query/concepts.md
index 44e5ea43d427..da0e774152d6 100644
--- a/docs/multi-stage-query/concepts.md
+++ b/docs/multi-stage-query/concepts.md
@@ -233,7 +233,8 @@ happens:
The [`maxNumTasks`](./reference.md#context-parameters) query parameter determines the maximum number of tasks your
query will use, including the one `query_controller` task. Generally, queries perform better with more workers. The
lowest possible value of `maxNumTasks` is two (one worker and one controller). Do not set this higher than the number of
-free slots available in your cluster; doing so will result in a [TaskStartTimeout](reference.md#error-codes) error.
+free slots available in your cluster; doing so will result in a [TaskStartTimeout](reference.md#error_TaskStartTimeout)
+error.
When [reading external data](#extern), EXTERN can read multiple files in parallel across
different worker tasks. However, EXTERN does not split individual files across multiple worker tasks. If you have a
diff --git a/docs/multi-stage-query/known-issues.md b/docs/multi-stage-query/known-issues.md
index c76ab57aa7ac..648d3c297b47 100644
--- a/docs/multi-stage-query/known-issues.md
+++ b/docs/multi-stage-query/known-issues.md
@@ -33,16 +33,18 @@ sidebar_label: Known issues
- Worker task stage outputs are stored in the working directory given by `druid.indexer.task.baseDir`. Stages that
generate a large amount of output data may exhaust all available disk space. In this case, the query fails with
-an [UnknownError](./reference.md#error-codes) with a message including "No space left on device".
+an [UnknownError](./reference.md#error_UnknownError) with a message including "No space left on device".
## SELECT
- SELECT from a Druid datasource does not include unpublished real-time data.
- GROUPING SETS and UNION ALL are not implemented. Queries using these features return a
- [QueryNotSupported](reference.md#error-codes) error.
+ [QueryNotSupported](reference.md#error_QueryNotSupported) error.
-- For some COUNT DISTINCT queries, you'll encounter a [QueryNotSupported](reference.md#error-codes) error that includes `Must not have 'subtotalsSpec'` as one of its causes. This is caused by the planner attempting to use GROUPING SETs, which are not implemented.
+- For some COUNT DISTINCT queries, you'll encounter a [QueryNotSupported](reference.md#error_QueryNotSupported) error
+ that includes `Must not have 'subtotalsSpec'` as one of its causes. This is caused by the planner attempting to use
+ GROUPING SETs, which are not implemented.
- The numeric varieties of the EARLIEST and LATEST aggregators do not work properly. Attempting to use the numeric
varieties of these aggregators leads to an error like
diff --git a/docs/multi-stage-query/reference.md b/docs/multi-stage-query/reference.md
index 3550566874b8..8ea9adf61ae6 100644
--- a/docs/multi-stage-query/reference.md
+++ b/docs/multi-stage-query/reference.md
@@ -32,9 +32,9 @@ sidebar_label: Reference
This topic is a reference guide for the multi-stage query architecture in Apache Druid. For examples of real-world
usage, refer to the [Examples](examples.md) page.
-### EXTERN
+### `EXTERN`
-Use the EXTERN function to read external data.
+Use the `EXTERN` function to read external data.
Function format:
@@ -50,7 +50,7 @@ FROM TABLE(
)
```
-EXTERN consists of the following parts:
+`EXTERN` consists of the following parts:
1. Any [Druid input source](../ingestion/native-batch-input-source.md) as a JSON-encoded string.
2. Any [Druid input format](../ingestion/data-formats.md) as a JSON-encoded string.
@@ -58,12 +58,134 @@ EXTERN consists of the following parts:
For more information, see [Read external data with EXTERN](concepts.md#extern).
-### INSERT
+### `HTTP`, `INLINE` and `LOCALFILES`
-Use the INSERT statement to insert data.
+While `EXTERN` allows you to specify an external table using JSON, other table functions allow you to
+describe the external table using SQL syntax. Each function works for one specific kind of input
+source. You provide properties using SQL named arguments, and you provide the row signature using the
+Druid SQL `EXTEND` keyword with SQL syntax and types. Function format:
-Unlike standard SQL, INSERT loads data into the target table according to column name, not positionally. If necessary,
-use `AS` in your SELECT column list to assign the correct names. Do not rely on their positions within the SELECT
+```sql
+SELECT
+  x, y, z
+FROM TABLE(
+ http(
+ userName => 'bob',
+ password => 'secret',
+ uris => 'http://foo.com/bar.csv',
+ format => 'csv'
+ )
+ ) EXTEND (x VARCHAR, y VARCHAR, z BIGINT)
+```
+
+Note that the `EXTEND` keyword is optional. The following is equally valid (and perhaps
+more convenient):
+
+```sql
+SELECT
+  x, y, z
+FROM TABLE(
+ http(
+ userName => 'bob',
+ password => 'secret',
+ uris => 'http://foo.com/bar.csv',
+ format => 'csv'
+ )
+ ) (x VARCHAR, y VARCHAR, z BIGINT)
+```
+
+
+The set of table functions and formats is preliminary in this release.
+
+#### `HTTP`
+
+The `HTTP` table function represents the `HttpInputSource` class in Druid which allows you to
+read from an HTTP server. The function accepts the following arguments:
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `userName` | Basic authentication user name | `httpAuthenticationUsername` | No |
+| `password` | Basic authentication password | `httpAuthenticationPassword` | No |
+| `passwordEnvVar` | Environment variable that contains the basic authentication password| `httpAuthenticationPassword` | No |
+| `uris` | Comma-separated list of URIs to read. | `uris` | Yes |
+
+#### `INLINE`
+
+The `INLINE` table function represents the `InlineInputSource` class in Druid which provides
+data directly in the table function. The function accepts the following arguments:
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `data` | Text lines of inline data. Separate lines with a newline. | `data` | Yes |
+
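+For example, a minimal sketch of an `INLINE` query over two rows of CSV data:
+
+```sql
+SELECT
+  x, y, z
+FROM TABLE(
+  inline(
+    data => 'a,b,1
+c,d,2',
+    format => 'csv'
+  )
+ ) EXTEND (x VARCHAR, y VARCHAR, z BIGINT)
+```
+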
+#### `LOCALFILES`
+
+The `LOCALFILES` table function represents the `LocalInputSource` class in Druid which reads
+files from the file system of the node running Druid. This is most useful for single-node
+installations. The function accepts the following arguments:
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `baseDir` | Directory to read from. | `baseDir` | No |
+| `filter` | Filter pattern to read. Example: `*.csv`. | `filter` | No |
+| `files` | Comma-separated list of files to read. | `files` | No |
+
+You must either provide the `baseDir` or the list of `files`. You can provide both, in which case
+the files are assumed to be relative to the `baseDir`. If you provide a `filter`, you must provide the
+`baseDir`.
+
+Note that, due to [Issue #13359](https://github.com/apache/druid/issues/13359), the functionality
+described above is broken. Until that issue is resolved, you must provide one or more absolute
+file paths in the `files` property and the other two properties are unavailable.
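+
+For example, a sketch that reads a single absolute file path, consistent with the workaround described above:
+
+```sql
+SELECT
+  x, y, z
+FROM TABLE(
+  localfiles(
+    files => '/tmp/example.csv',
+    format => 'csv'
+  )
+ ) EXTEND (x VARCHAR, y VARCHAR, z BIGINT)
+```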
+
+#### Table Function Format
+
+Each of the table functions above requires that you specify a format.
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `format` | The input format, using the same names as for `EXTERN`. | `inputFormat.type` | Yes |
+
+#### CSV Format
+
+Use the `csv` format to read from CSV. This choice selects the Druid `CsvInputFormat` class.
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `listDelimiter` | The delimiter to use for fields that represent a list of strings. | `listDelimiter` | No |
+| `skipRows` | The number of rows to skip at the start of the file. Default is 0. | `skipHeaderRows` | No |
+
+MSQ does not have the ability to infer schema from a CSV file, so the `findColumnsFromHeader` property
+is unavailable. Instead, columns are given using the `EXTEND` syntax described above.
+
+#### Delimited Text Format
+
+Use the `tsv` format to read from an arbitrary delimited (CSV-like) file such as tab-delimited,
+pipe-delimited, etc. This choice selects the Druid `DelimitedInputFormat` class.
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `delimiter` | The delimiter which separates fields. | `delimiter` | Yes |
+| `listDelimiter` | The delimiter to use for fields that represent a list of strings. | `listDelimiter` | No |
+| `skipRows` | The number of rows to skip at the start of the file. Default is 0. | `skipHeaderRows` | No |
+
+As noted above, MSQ cannot infer schema using headers. Use `EXTEND` instead.
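+
+For example, a sketch that reads a pipe-delimited file over HTTP; the URI is a placeholder:
+
+```sql
+SELECT
+  x, y, z
+FROM TABLE(
+  http(
+    uris => 'http://example.com/data.psv',
+    format => 'tsv',
+    delimiter => '|'
+  )
+ ) EXTEND (x VARCHAR, y VARCHAR, z BIGINT)
+```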
+
+#### JSON Format
+
+Use the `json` format to read from a JSON input source. This choice selects the Druid `JsonInputFormat` class.
+
+| Name | Description | JSON equivalent | Required |
+| ---- | ----------- | --------------- | -------- |
+| `keepNulls` | Whether to keep null values. Defaults to `false`. | `keepNullColumns` | No |
+
+
+### `INSERT`
+
+Use the `INSERT` statement to insert data.
+
+Unlike standard SQL, `INSERT` loads data into the target table according to column name, not positionally. If necessary,
+use `AS` in your `SELECT` column list to assign the correct names. Do not rely on their positions within the `SELECT`
clause.
Statement format:
@@ -85,15 +207,15 @@ INSERT consists of the following parts:
For more information, see [Load data with INSERT](concepts.md#insert).
-### REPLACE
+### `REPLACE`
-You can use the REPLACE function to replace all or some of the data.
+You can use the `REPLACE` function to replace all or some of the data.
-Unlike standard SQL, REPLACE loads data into the target table according to column name, not positionally. If necessary,
-use `AS` in your SELECT column list to assign the correct names. Do not rely on their positions within the SELECT
+Unlike standard SQL, `REPLACE` loads data into the target table according to column name, not positionally. If necessary,
+use `AS` in your `SELECT` column list to assign the correct names. Do not rely on their positions within the `SELECT`
clause.
-#### REPLACE all data
+#### `REPLACE` all data
Function format to replace all data:
@@ -105,7 +227,7 @@ PARTITIONED BY
[ CLUSTERED BY ]
```
-#### REPLACE specific time ranges
+#### `REPLACE` specific time ranges
Function format to replace specific time ranges:
@@ -117,7 +239,7 @@ PARTITIONED BY
[ CLUSTERED BY ]
```
-REPLACE consists of the following parts:
+`REPLACE` consists of the following parts:
1. Optional [context parameters](./reference.md#context-parameters).
2. A `REPLACE INTO <target table>` clause at the start of your query, such as `REPLACE INTO "your-table".`
@@ -132,7 +254,7 @@ REPLACE consists of the following parts:
For more information, see [Overwrite data with REPLACE](concepts.md#replace).
-### PARTITIONED BY
+### `PARTITIONED BY`
The `PARTITIONED BY <time granularity>` clause is required for [INSERT](#insert) and [REPLACE](#replace). See
[Partitioning](concepts.md#partitioning) for details.
@@ -164,7 +286,7 @@ The following ISO 8601 periods are supported for `TIME_FLOOR`:
For more information about partitioning, see [Partitioning](concepts.md#partitioning).
-### CLUSTERED BY
+### `CLUSTERED BY`
The `CLUSTERED BY <column list>` clause is optional for [INSERT](#insert) and [REPLACE](#replace). It accepts a list of
column names or expressions.
@@ -203,14 +325,37 @@ The following table lists the context parameters for the MSQ task engine:
| `maxParseExceptions`| SELECT, INSERT, REPLACE Maximum number of parse exceptions that are ignored while executing the query before it stops with `TooManyWarningsFault`. To ignore all the parse exceptions, set the value to -1.| 0 |
| `rowsPerSegment` | INSERT or REPLACE The number of rows per segment to target. The actual number of rows per segment may be somewhat higher or lower than this number. In most cases, use the default. For general information about sizing rows per segment, see [Segment Size Optimization](../operations/segment-optimization.md). | 3,000,000 |
| `indexSpec` | INSERT or REPLACE An [`indexSpec`](../ingestion/ingestion-spec.md#indexspec) to use when generating segments. May be a JSON string or object. See [Front coding](../ingestion/ingestion-spec.md#front-coding) for details on configuring an `indexSpec` with front coding. | See [`indexSpec`](../ingestion/ingestion-spec.md#indexspec). |
+| `clusterStatisticsMergeMode` | Whether to use parallel or sequential mode for merging the worker sketches. Can be `PARALLEL`, `SEQUENTIAL`, or `AUTO`. See [Sketch Merging Mode](#sketch-merging-mode) for more information. | `AUTO` |
+
+## Sketch Merging Mode
+
+This section details the advantages and performance implications of the various cluster statistics merge modes.
+
+If a query requires key statistics to generate partition boundaries, key statistics are gathered by the workers while
+reading rows from the datasource. These statistics must be transferred to the controller to be merged together.
+`clusterStatisticsMergeMode` configures the way in which this happens.
+
+`PARALLEL` mode fetches the key statistics for all time chunks from all workers together, and the controller then downsamples
+the sketch if it does not fit in memory. This is faster than `SEQUENTIAL` mode because there is less overhead in fetching sketches
+for all time chunks together. This mode works well for small sketches that won't be downsampled even when merged together, or when
+accuracy in segment sizing for the ingestion is not very important.
+
+`SEQUENTIAL` mode fetches the sketches in ascending order of time and generates the partition boundaries for one time
+chunk at a time. This gives more working memory to the controller for merging sketches, which results in less
+downsampling and thus more accuracy. There is, however, a time overhead to fetching sketches in sequential order. This mode
+works well for cases where accuracy is important.
+
+`AUTO` mode tries to find the best approach based on the number of workers and the size of the input rows. If there are more
+than 100 workers, or if the combined sketch size among all workers is more than 1 GB, `SEQUENTIAL` is chosen; otherwise,
+`PARALLEL` is chosen.
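+
+For example, to force sequential merging, you might submit an MSQ query payload whose context sets the mode; the query, table, and source names here are placeholders:
+
+```json
+{
+  "query": "INSERT INTO my_table SELECT * FROM my_source PARTITIONED BY DAY",
+  "context": {
+    "clusterStatisticsMergeMode": "SEQUENTIAL"
+  }
+}
+```
+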
## Durable Storage
+
This section enumerates the advantages and performance implications of enabling durable storage while executing MSQ tasks.
To prevent durable storage from getting filled up with temporary files in case the tasks fail to clean them up, a periodic
cleaner can be scheduled to clean the directories that do not correspond to a running controller task. It utilizes
-the storage connector to work upon the durable storage. The durable storage location should only be utilized to store the output
-for cluster's MSQ tasks. If the location contains other files or directories, then they will get cleaned up as well.
+the storage connector to operate on the durable storage. The durable storage location should only be used to store the output
+of the cluster's MSQ tasks. If the location contains other files or directories, then they will get cleaned up as well.
The following table lists the properties that can be set to control the behavior of the durable storage of the cluster.
|Parameter |Default | Description |
@@ -227,14 +372,14 @@ The following table lists query limits:
| Limit | Value | Error if exceeded |
|---|---|---|
-| Size of an individual row written to a frame. Row size when written to a frame may differ from the original row size. | 1 MB | `RowTooLarge` |
-| Number of segment-granular time chunks encountered during ingestion. | 5,000 | `TooManyBuckets` |
-| Number of input files/segments per worker. | 10,000 | `TooManyInputFiles` |
-| Number of output partitions for any one stage. Number of segments generated during ingestion. |25,000 | `TooManyPartitions` |
-| Number of output columns for any one stage. | 2,000 | `TooManyColumns` |
-| Number of cluster by columns that can appear in a stage | 1,500 | `TooManyClusteredByColumns` |
-| Number of workers for any one stage. | Hard limit is 1,000. Memory-dependent soft limit may be lower. | `TooManyWorkers` |
-| Maximum memory occupied by broadcasted tables. | 30% of each [processor memory bundle](concepts.md#memory-usage). | `BroadcastTablesTooLarge` |
+| Size of an individual row written to a frame. Row size when written to a frame may differ from the original row size. | 1 MB | [`RowTooLarge`](#error_RowTooLarge) |
+| Number of segment-granular time chunks encountered during ingestion. | 5,000 | [`TooManyBuckets`](#error_TooManyBuckets) |
+| Number of input files/segments per worker. | 10,000 | [`TooManyInputFiles`](#error_TooManyInputFiles) |
+| Number of output partitions for any one stage. Number of segments generated during ingestion. |25,000 | [`TooManyPartitions`](#error_TooManyPartitions) |
+| Number of output columns for any one stage. | 2,000 | [`TooManyColumns`](#error_TooManyColumns) |
+| Number of cluster by columns that can appear in a stage | 1,500 | [`TooManyClusteredByColumns`](#error_TooManyClusteredByColumns) |
+| Number of workers for any one stage. | Hard limit is 1,000. Memory-dependent soft limit may be lower. | [`TooManyWorkers`](#error_TooManyWorkers) |
+| Maximum memory occupied by broadcasted tables. | 30% of each [processor memory bundle](concepts.md#memory-usage). | [`BroadcastTablesTooLarge`](#error_BroadcastTablesTooLarge) |
@@ -244,30 +389,30 @@ The following table describes error codes you may encounter in the `multiStageQu
| Code | Meaning | Additional fields |
|---|---|---|
-| `BroadcastTablesTooLarge` | The size of the broadcast tables used in the right hand side of the join exceeded the memory reserved for them in a worker task. Try increasing the peon memory or reducing the size of the broadcast tables. | `maxBroadcastTablesSize`: Memory reserved for the broadcast tables, measured in bytes. |
-| `Canceled` | The query was canceled. Common reasons for cancellation:User-initiated shutdown of the controller task via the `/druid/indexer/v1/task/{taskId}/shutdown` API. Restart or failure of the server process that was running the controller task. | |
-| `CannotParseExternalData` | A worker task could not parse data from an external datasource. | `errorMessage`: More details on why parsing failed. |
-| `ColumnNameRestricted` | The query uses a restricted column name. | `columnName`: The restricted column name. |
-| `ColumnTypeNotSupported` | The column type is not supported. This can be because: Support for writing or reading from a particular column type is not supported. The query attempted to use a column type that is not supported by the frame format. This occurs with ARRAY types, which are not yet implemented for frames. | `columnName`: The column name with an unsupported type. `columnType`: The unknown column type. |
-| `InsertCannotAllocateSegment` | The controller task could not allocate a new segment ID due to conflict with existing segments or pending segments. Common reasons for such conflicts: Attempting to mix different granularities in the same intervals of the same datasource. Prior ingestions that used non-extendable shard specs. | `dataSource` `interval`: The interval for the attempted new segment allocation. |
-| `InsertCannotBeEmpty` | An INSERT or REPLACE query did not generate any output rows in a situation where output rows are required for success. This can happen for INSERT or REPLACE queries with `PARTITIONED BY` set to something other than `ALL` or `ALL TIME`. | `dataSource` |
-| `InsertCannotOrderByDescending` | An INSERT query contained a `CLUSTERED BY` expression in descending order. Druid's segment generation code only supports ascending order. | `columnName` |
-| `InsertCannotReplaceExistingSegment` | A REPLACE query cannot proceed because an existing segment partially overlaps those bounds, and the portion within the bounds is not fully overshadowed by query results. There are two ways to address this without modifying your query:Shrink the OVERLAP filter to match the query results. Expand the OVERLAP filter to fully contain the existing segment. | `segmentId`: The existing segment
-| `InsertLockPreempted` | An INSERT or REPLACE query was canceled by a higher-priority ingestion job, such as a real-time ingestion task. | |
-| `InsertTimeNull` | An INSERT or REPLACE query encountered a null timestamp in the `__time` field. This can happen due to using an expression like `TIME_PARSE(timestamp) AS __time` with a timestamp that cannot be parsed. (TIME_PARSE returns null when it cannot parse a timestamp.) In this case, try parsing your timestamps using a different function or pattern. If your timestamps may genuinely be null, consider using COALESCE to provide a default value. One option is CURRENT_TIMESTAMP, which represents the start time of the job. |
-| `InsertTimeOutOfBounds` | A REPLACE query generated a timestamp outside the bounds of the TIMESTAMP parameter for your OVERWRITE WHERE clause. To avoid this error, verify that the you specified is valid. | `interval`: time chunk interval corresponding to the out-of-bounds timestamp |
-| `InvalidNullByte` | A string column included a null byte. Null bytes in strings are not permitted. | `column`: The column that included the null byte |
-| `QueryNotSupported` | QueryKit could not translate the provided native query to a multi-stage query. This can happen if the query uses features that aren't supported, like GROUPING SETS. | |
-| `RowTooLarge` | The query tried to process a row that was too large to write to a single frame. See the [Limits](#limits) table for the specific limit on frame size. Note that the effective maximum row size is smaller than the maximum frame size due to alignment considerations during frame writing. | `maxFrameSize`: The limit on the frame size. |
-| `TaskStartTimeout` | Unable to launch all the worker tasks in time. There might be insufficient available slots to start all the worker tasks simultaneously. Try splitting up the query into smaller chunks with lesser `maxNumTasks` number. Another option is to increase capacity. | `numTasks`: The number of tasks attempted to launch. |
-| `TooManyBuckets` | Exceeded the number of partition buckets for a stage. Partition buckets are only used for `segmentGranularity` during INSERT queries. The most common reason for this error is that your `segmentGranularity` is too narrow relative to the data. See the [Limits](#limits) table for the specific limit. | `maxBuckets`: The limit on buckets. |
-| `TooManyInputFiles` | Exceeded the number of input files/segments per worker. See the [Limits](#limits) table for the specific limit. | `numInputFiles`: The total number of input files/segments for the stage. `maxInputFiles`: The maximum number of input files/segments per worker per stage. `minNumWorker`: The minimum number of workers required for a successful run. |
-| `TooManyPartitions` | Exceeded the number of partitions for a stage. The most common reason for this is that the final stage of an INSERT or REPLACE query generated too many segments. See the [Limits](#limits) table for the specific limit. | `maxPartitions`: The limit on partitions which was exceeded |
-| `TooManyClusteredByColumns` | Exceeded the number of cluster by columns for a stage. See the [Limits](#limits) table for the specific limit. | `numColumns`: The number of columns requested. `maxColumns`: The limit on columns which was exceeded.`stage`: The stage number exceeding the limit |
-| `TooManyColumns` | Exceeded the number of columns for a stage. See the [Limits](#limits) table for the specific limit. | `numColumns`: The number of columns requested. `maxColumns`: The limit on columns which was exceeded. |
-| `TooManyWarnings` | Exceeded the allowed number of warnings of a particular type. | `rootErrorCode`: The error code corresponding to the exception that exceeded the required limit. `maxWarnings`: Maximum number of warnings that are allowed for the corresponding `rootErrorCode`. |
-| `TooManyWorkers` | Exceeded the supported number of workers running simultaneously. See the [Limits](#limits) table for the specific limit. | `workers`: The number of simultaneously running workers that exceeded a hard or soft limit. This may be larger than the number of workers in any one stage if multiple stages are running simultaneously. `maxWorkers`: The hard or soft limit on workers that was exceeded. |
-| `NotEnoughMemory` | Insufficient memory to launch a stage. | `serverMemory`: The amount of memory available to a single process. `serverWorkers`: The number of workers running in a single process. `serverThreads`: The number of threads in a single process. |
-| `WorkerFailed` | A worker task failed unexpectedly. | `errorMsg` `workerTaskId`: The ID of the worker task. |
-| `WorkerRpcFailed` | A remote procedure call to a worker task failed and could not recover. | `workerTaskId`: the id of the worker task |
-| `UnknownError` | All other errors. | `message` |
+| <a name="error_BroadcastTablesTooLarge">`BroadcastTablesTooLarge`</a> | The size of the broadcast tables used in the right-hand side of the join exceeded the memory reserved for them in a worker task. Try increasing the peon memory or reducing the size of the broadcast tables. | `maxBroadcastTablesSize`: Memory reserved for the broadcast tables, measured in bytes. |
+| <a name="error_Canceled">`Canceled`</a> | The query was canceled. Common reasons for cancellation: user-initiated shutdown of the controller task via the `/druid/indexer/v1/task/{taskId}/shutdown` API, or restart or failure of the server process that was running the controller task. | |
+| <a name="error_CannotParseExternalData">`CannotParseExternalData`</a> | A worker task could not parse data from an external datasource. | `errorMessage`: More details on why parsing failed. |
+| <a name="error_ColumnNameRestricted">`ColumnNameRestricted`</a> | The query uses a restricted column name. | `columnName`: The restricted column name. |
+| <a name="error_ColumnTypeNotSupported">`ColumnTypeNotSupported`</a> | The column type is not supported. This can happen when support for writing or reading a particular column type is not implemented, or when the query attempted to use a column type that is not supported by the frame format. The latter occurs with ARRAY types, which are not yet implemented for frames. | `columnName`: The column name with an unsupported type. `columnType`: The unknown column type. |
+| <a name="error_InsertCannotAllocateSegment">`InsertCannotAllocateSegment`</a> | The controller task could not allocate a new segment ID due to a conflict with existing segments or pending segments. Common reasons for such conflicts: attempting to mix different granularities in the same intervals of the same datasource, or prior ingestions that used non-extendable shard specs. | `dataSource` `interval`: The interval for the attempted new segment allocation. |
+| <a name="error_InsertCannotBeEmpty">`InsertCannotBeEmpty`</a> | An INSERT or REPLACE query did not generate any output rows in a situation where output rows are required for success. This can happen for INSERT or REPLACE queries with `PARTITIONED BY` set to something other than `ALL` or `ALL TIME`. | `dataSource` |
+| <a name="error_InsertCannotOrderByDescending">`InsertCannotOrderByDescending`</a> | An INSERT query contained a `CLUSTERED BY` expression in descending order. Druid's segment generation code only supports ascending order. | `columnName` |
+| <a name="error_InsertCannotReplaceExistingSegment">`InsertCannotReplaceExistingSegment`</a> | A REPLACE query cannot proceed because an existing segment partially overlaps those bounds, and the portion within the bounds is not fully overshadowed by query results. There are two ways to address this without modifying your query: shrink the OVERLAP filter to match the query results, or expand the OVERLAP filter to fully contain the existing segment. | `segmentId`: The existing segment |
+| <a name="error_InsertLockPreempted">`InsertLockPreempted`</a> | An INSERT or REPLACE query was canceled by a higher-priority ingestion job, such as a real-time ingestion task. | |
+| <a name="error_InsertTimeNull">`InsertTimeNull`</a> | An INSERT or REPLACE query encountered a null timestamp in the `__time` field. This can happen due to using an expression like `TIME_PARSE(timestamp) AS __time` with a timestamp that cannot be parsed. (`TIME_PARSE` returns null when it cannot parse a timestamp.) In this case, try parsing your timestamps using a different function or pattern. If your timestamps may genuinely be null, consider using `COALESCE` to provide a default value. One option is `CURRENT_TIMESTAMP`, which represents the start time of the job. | |
+| <a name="error_InsertTimeOutOfBounds">`InsertTimeOutOfBounds`</a> | A REPLACE query generated a timestamp outside the bounds of the TIMESTAMP parameter for your OVERWRITE WHERE clause. To avoid this error, verify that the interval you specified is valid. | `interval`: Time chunk interval corresponding to the out-of-bounds timestamp |
+| <a name="error_InvalidNullByte">`InvalidNullByte`</a> | A string column included a null byte. Null bytes in strings are not permitted. | `column`: The column that included the null byte |
+| <a name="error_QueryNotSupported">`QueryNotSupported`</a> | QueryKit could not translate the provided native query to a multi-stage query. This can happen if the query uses features that aren't supported, like GROUPING SETS. | |
+| <a name="error_RowTooLarge">`RowTooLarge`</a> | The query tried to process a row that was too large to write to a single frame. See the [Limits](#limits) table for specific limits on frame size. Note that the effective maximum row size is smaller than the maximum frame size due to alignment considerations during frame writing. | `maxFrameSize`: The limit on the frame size. |
+| <a name="error_TaskStartTimeout">`TaskStartTimeout`</a> | Unable to launch all the worker tasks in time. There might be insufficient available slots to start all the worker tasks simultaneously. Try splitting up the query into smaller chunks using a smaller value of `maxNumTasks`. Another option is to increase capacity. | `numTasks`: The number of tasks attempted to launch. |
+| <a name="error_TooManyBuckets">`TooManyBuckets`</a> | Exceeded the maximum number of partition buckets for a stage (5,000 partition buckets).<br />Partition buckets are created for each [`PARTITIONED BY`](#partitioned-by) time chunk for INSERT and REPLACE queries. The most common reason for this error is that your `PARTITIONED BY` is too narrow relative to your data. | `maxBuckets`: The limit on partition buckets. |
+| <a name="error_TooManyInputFiles">`TooManyInputFiles`</a> | Exceeded the maximum number of input files or segments per worker (10,000 files or segments). If you encounter this limit, consider adding more workers, or breaking up your query into smaller queries that process fewer files or segments per query. | `numInputFiles`: The total number of input files/segments for the stage. `maxInputFiles`: The maximum number of input files/segments per worker per stage. `minNumWorker`: The minimum number of workers required for a successful run. |
+| <a name="error_TooManyPartitions">`TooManyPartitions`</a> | Exceeded the maximum number of partitions for a stage (25,000 partitions). This can occur with INSERT or REPLACE statements that generate large numbers of segments, since each segment is associated with a partition. If you encounter this limit, consider breaking up your INSERT or REPLACE statement into smaller statements that process less data per statement. | `maxPartitions`: The limit on partitions which was exceeded |
+| <a name="error_TooManyClusteredByColumns">`TooManyClusteredByColumns`</a> | Exceeded the maximum number of clustering columns for a stage (1,500 columns). This can occur with `CLUSTERED BY`, `ORDER BY`, or `GROUP BY` with a large number of columns. | `numColumns`: The number of columns requested. `maxColumns`: The limit on columns which was exceeded. `stage`: The stage number exceeding the limit |
+| <a name="error_TooManyColumns">`TooManyColumns`</a> | Exceeded the maximum number of columns for a stage (2,000 columns). | `numColumns`: The number of columns requested. `maxColumns`: The limit on columns which was exceeded. |
+| <a name="error_TooManyWarnings">`TooManyWarnings`</a> | Exceeded the maximum allowed number of warnings of a particular type. | `rootErrorCode`: The error code corresponding to the exception that exceeded the required limit. `maxWarnings`: Maximum number of warnings that are allowed for the corresponding `rootErrorCode`. |
+| <a name="error_TooManyWorkers">`TooManyWorkers`</a> | Exceeded the maximum number of simultaneously-running workers. See the [Limits](#limits) table for more details. | `workers`: The number of simultaneously running workers that exceeded a hard or soft limit. This may be larger than the number of workers in any one stage if multiple stages are running simultaneously. `maxWorkers`: The hard or soft limit on workers that was exceeded. If this is lower than the hard limit (1,000 workers), then you can increase the limit by adding more memory to each task. |
+| <a name="error_NotEnoughMemory">`NotEnoughMemory`</a> | Insufficient memory to launch a stage. | `serverMemory`: The amount of memory available to a single process. `serverWorkers`: The number of workers running in a single process. `serverThreads`: The number of threads in a single process. |
+| <a name="error_WorkerFailed">`WorkerFailed`</a> | A worker task failed unexpectedly. | `errorMsg` `workerTaskId`: The ID of the worker task. |
+| <a name="error_WorkerRpcFailed">`WorkerRpcFailed`</a> | A remote procedure call to a worker task failed and could not recover. | `workerTaskId`: The ID of the worker task |
+| <a name="error_UnknownError">`UnknownError`</a> | All other errors. | `message` |
diff --git a/docs/operations/auth-ldap.md b/docs/operations/auth-ldap.md
index b9603a0c38fd..5a2d8b7e292f 100644
--- a/docs/operations/auth-ldap.md
+++ b/docs/operations/auth-ldap.md
@@ -1,6 +1,7 @@
---
id: auth-ldap
-title: "LDAP auth"
+title: "Configure LDAP authentication"
+sidebar_label: "LDAP auth"
---
+You can use [Lightweight Directory Access Protocol (LDAP)](https://en.wikipedia.org/wiki/Lightweight_Directory_Access_Protocol) to secure access to Apache Druid. This topic describes how to set up Druid authentication and authorization with LDAP and LDAP over TLS (LDAPS). The examples on this page show the configuration for an Active Directory LDAP system.
-This page describes how to set up Druid user authentication and authorization through LDAP. The first step is to enable LDAP authentication and authorization for Druid. You then map an LDAP group to roles and assign permissions to roles.
+The first step is to enable LDAP authentication and authorization for Druid. You then map an LDAP group to Druid roles and assign permissions to those roles. After you've completed this configuration, you can optionally enable LDAPS to make LDAP traffic confidential and secure.
-## Enable LDAP in Druid
+## Prerequisites
-Before starting, verify that the active directory is reachable from the Druid Master servers. Command line tools such as `ldapsearch` and `ldapwhoami`, which are included with OpenLDAP, are useful for this testing.
+Before you start to configure LDAP for Druid, test your LDAP connection and perform a sample search.
-### Check the connection
+### Check your LDAP connection
-First test that the basic connection and user credential works. For example, given a user `uuser1@example.com`, try:
+Test your LDAP connection to verify it works with user credentials. Later in the process you [configure Druid for LDAP authentication](#configure-druid-for-ldap-authentication) with this user as the `bindUser`.
+
+The following example command tests the connection for the user `myuser@example.com`. Insert your LDAP server IP address. Modify the port number of your LDAP instance if it listens on a port other than `389`.
```bash
-ldapwhoami -vv -H ldap://:389 -D"uuser1@example.com" -W
+ldapwhoami -vv -H ldap://ip_address:389 -D "myuser@example.com" -W
```
-Enter the password associated with the user when prompted and verify that the command succeeded. If it didn't, try the following troubleshooting steps:
+Enter the password for the user when prompted and verify that the command succeeded. If it failed, check the following:
+
+- Make sure you're using the correct port for your LDAP instance.
+- Check if a network firewall is preventing connections to the LDAP port (see the connectivity check below).
+- Review your LDAP implementation details to see whether you need to specifically allow LDAP clients at the LDAP server. If so, add the Druid Coordinator server to the allow list.
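+
+To check basic TCP reachability of the LDAP port from the Druid Coordinator host, you can use a tool such as `nc` (a sketch; replace `ip_address` with your LDAP server address and adjust the port if your instance listens elsewhere):
+
+```bash
+# Succeeds quickly if the port is reachable; hangs or errors if a firewall blocks it.
+nc -zv ip_address 389
+```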
-* Verify that you've used the correct port for your LDAP instance. By default, the LDAP port is 389, but double-check with your LDAP admin if unable to connect.
-* Check whether a network firewall is not preventing connections to the LDAP port.
-* Check whether LDAP clients need to be specifically whitelisted at the LDAP server to be able to reach it. If so, add the Druid Coordinator server to the AD whitelist.
+### Test your LDAP search
+Once your LDAP connection is working, search for a user. For example, the following command searches for the user `myuser` in an Active Directory system. The `sAMAccountName` attribute is specific to Active Directory and contains the authenticated user identity:
-### Check the search criteria
+```bash
+ldapsearch -x -W -H ldap://ip_address:389 -D "cn=admin,dc=example,dc=com" -b "dc=example,dc=com" "(sAMAccountName=myuser)" +
+```
-After verifying basic connectivity, check your search criteria. For example, the command for searching for user `uuser1@example.com ` is as follows:
+The `memberOf` attribute in the results shows the groups the user belongs to. For example, the following response shows that the user is a member of the `mygroup` group:
```bash
-ldapsearch -x -W -H ldap:// -D"uuser1@example.com" -b "dc=example,dc=com" "(sAMAccountName=uuser1)"
+memberOf: cn=mygroup,ou=groups,dc=example,dc=com
```
-Note the `memberOf` attribute in the results; it shows the groups that the user belongs to. You will use this value to map the LDAP group to the Druid roles later. This attribute may be implemented differently on different types of LDAP servers. For instance, some LDAP servers may support recursive groupings, and some may not. Some LDAP server implementations may not have any object classes that contain this attribute altogether. If your LDAP server does not use the `memberOf` attribute, then Druid will not be able to determine a user's group membership using LDAP. The sAMAccountName attribute used in this example contains the authenticated user identity. This is an attribute of an object class specific to Microsoft Active Directory. The object classes and attribute used in your LDAP server may be different.
+You use this information to map the LDAP group to Druid roles in a later step.
+
+> Druid uses the `memberOf` attribute to determine a user's group membership using LDAP. If your LDAP server implementation doesn't include this attribute, you must complete some additional steps when you [map LDAP groups to Druid roles](#map-ldap-groups-to-druid-roles).
+
+## Configure Druid for LDAP authentication
+
+To configure Druid to use LDAP authentication, follow these steps. See [Configuration reference](../configuration/index.md) for the location of the configuration files.
+
+1. Create a user in your LDAP system that you'll use both for internal communication with Druid and as the LDAP initial admin user. See [Security overview](./security-overview.md) for more information.
+In the example below, the LDAP user is `internal@example.com`.
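+
+   You can verify the new user's credentials with the same `ldapwhoami` check used in [Check your LDAP connection](#check-your-ldap-connection), for example:
+
+   ```bash
+   ldapwhoami -vv -H ldap://ip_address:389 -D "internal@example.com" -W
+   ```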
-## Configure Druid user authentication with LDAP/Active Directory
+2. Enable the `druid-basic-security` extension in the `common.runtime.properties` file.
-1. Enable the `druid-basic-security` extension in the `common.runtime.properties` file. See [Security Overview](security-overview.md) for details.
-2. As a best practice, create a user in LDAP to be used for internal communication with Druid.
-3. In `common.runtime.properties`, update LDAP-related properties, as shown in the following listing:
- ```
- druid.auth.authenticatorChain=["ldap"]
- druid.auth.authenticator.ldap.type=basic
- druid.auth.authenticator.ldap.enableCacheNotifications=true
- druid.auth.authenticator.ldap.credentialsValidator.type=ldap
- druid.auth.authenticator.ldap.credentialsValidator.url=ldap://:
- druid.auth.authenticator.ldap.credentialsValidator.bindUser=
- druid.auth.authenticator.ldap.credentialsValidator.bindPassword=
- druid.auth.authenticator.ldap.credentialsValidator.baseDn=
- druid.auth.authenticator.ldap.credentialsValidator.userSearch=
- druid.auth.authenticator.ldap.credentialsValidator.userAttribute=sAMAccountName
- druid.auth.authenticator.ldap.authorizerName=ldapauth
- druid.escalator.type=basic
- druid.escalator.internalClientUsername=
- druid.escalator.internalClientPassword=Welcome123
- druid.escalator.authorizerName=ldapauth
- druid.auth.authorizers=["ldapauth"]
- druid.auth.authorizer.ldapauth.type=basic
- druid.auth.authorizer.ldapauth.initialAdminUser=AD user who acts as the initial admin user, e.g.: internal@example.com>
- druid.auth.authorizer.ldapauth.initialAdminRole=admin
- druid.auth.authorizer.ldapauth.roleProvider.type=ldap
+3. In the `common.runtime.properties` file, add the following lines for LDAP properties and substitute the values for your own. See [Druid basic security](../development/extensions-core/druid-basic-security.md#properties-for-ldap-user-authentication) for details about these properties.
+
+ ```
+ druid.auth.authenticatorChain=["ldap"]
+ druid.auth.authenticator.ldap.type=basic
+ druid.auth.authenticator.ldap.enableCacheNotifications=true
+ druid.auth.authenticator.ldap.credentialsValidator.type=ldap
+ druid.auth.authenticator.ldap.credentialsValidator.url=ldap://ip_address:port
+ druid.auth.authenticator.ldap.credentialsValidator.bindUser=administrator@example.com
+ druid.auth.authenticator.ldap.credentialsValidator.bindPassword=adminpassword
+ druid.auth.authenticator.ldap.credentialsValidator.baseDn=dc=example,dc=com
+ druid.auth.authenticator.ldap.credentialsValidator.userSearch=(&(sAMAccountName=%s)(objectClass=user))
+ druid.auth.authenticator.ldap.credentialsValidator.userAttribute=sAMAccountName
+ druid.auth.authenticator.ldap.authorizerName=ldapauth
+ druid.escalator.type=basic
+ druid.escalator.internalClientUsername=internal@example.com
+ druid.escalator.internalClientPassword=internaluserpassword
+ druid.escalator.authorizerName=ldapauth
+ druid.auth.authorizers=["ldapauth"]
+ druid.auth.authorizer.ldapauth.type=basic
+ druid.auth.authorizer.ldapauth.initialAdminUser=internal@example.com
+ druid.auth.authorizer.ldapauth.initialAdminRole=admin
+ druid.auth.authorizer.ldapauth.roleProvider.type=ldap
```
+ Note the following:
- Notice that the LDAP user created in the previous step, `internal@example.com`, serves as the internal client user and the initial admin user.
+ - `bindUser`: A user for connecting to LDAP. This should be the same user you used to [test your LDAP search](#test-your-ldap-search).
+ - `userSearch`: Your LDAP search syntax.
+ - `userAttribute`: The user search attribute.
+ - `internal@example.com` is the LDAP user you created in step 1. In the example it serves as both the internal client user and the initial admin user.
-## Use LDAP groups to assign roles
+ > In the above example, the [Druid escalator](../development/extensions-core/druid-basic-security.md#escalator) and LDAP initial admin user are set to the same user, `internal@example.com`. If the escalator is set to a different user, you must follow steps 4 and 5 to create the group mapping and allocate initial roles before the rest of the cluster can function.
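+
+   To confirm that your `userSearch` filter matches the intended users, you can test it with `ldapsearch`, substituting a concrete username for `%s` (a sketch based on the earlier search example):
+
+   ```bash
+   ldapsearch -x -W -H ldap://ip_address:389 -D "cn=admin,dc=example,dc=com" -b "dc=example,dc=com" "(&(sAMAccountName=myuser)(objectClass=user))" dn
+   ```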
-You can map LDAP groups to a role in Druid. Members in the group get access to the permissions of the corresponding role.
+4. Save your group mapping to a JSON file. An example file `groupmap.json` looks like this:
+
+ ```
+ {
+ "name": "mygroupmap",
+ "groupPattern": "CN=mygroup,CN=Users,DC=example,DC=com",
+ "roles": [
+ "readRole"
+ ]
+ }
+ ```
+ In the example, the LDAP group `mygroup` maps to Druid role `readRole` and the name of the mapping is `mygroupmap`.
+5. Use the Druid API to create the group mapping and allocate initial roles according to your JSON file. The following example uses curl to create the mapping defined in `groupmap.json` for the LDAP group `mygroup`:
+
+ ```
+ curl -i -v -H "Content-Type: application/json" -u internal -X POST -d @groupmap.json http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/mygroupmap
+ ```
+6. Check that the group mapping was created successfully. The following example request lists all group mappings:
-### Step 1: Create a role
+ ```
+ curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings
+ ```
-First create the role in Druid using the Druid REST API.
+## Map LDAP groups to Druid roles
-Creating a role involves submitting a POST request to the Coordinator process.
+Once you've completed the initial setup and mapping, you can map more LDAP groups to Druid roles. Members of an LDAP group get access to the permissions of the corresponding Druid role.
-The following REST APIs to create the role to read access for datasource, config, state.
+### Create a Druid role
-> As mentioned, the REST API calls need to address the Coordinator node. The examples used below use localhost as the Coordinator host and 8081 as the port. Adjust these settings according to your deployment.
+To create a Druid role, you can submit a POST request to the Coordinator process using the Druid REST API or you can use the Druid console.
-Call the following API to create role `readRole` .
+The examples below use `localhost` as the Coordinator host and `8081` as the port. Amend these properties according to the details of your deployment.
+
+Example request to create a role named `readRole`:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/roles/readRole
+curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/roles/readRole
```
-Check that the role has been created successfully by entering the following:
+Check that Druid created the role successfully. The following example request lists all roles:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/roles
+curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/roles
```
+### Add permissions to the Druid role
-### Step 2: Add permissions to a role
-
-You can now add one or more permission to the role. The following example adds read-only access to a `wikipedia` data source.
+Once you have a Druid role you can add permissions to it. The following example adds read-only access to a `wikipedia` data source.
Given the following JSON in a file named `perm.json`:
```
-[{ "resource": { "name": "wikipedia", "type": "DATASOURCE" }, "action": "READ" }
-,{ "resource": { "name": ".*", "type": "STATE" }, "action": "READ" },
-{ "resource": {"name": ".*", "type": "CONFIG"}, "action": "READ"}]
-```
-
-The following command associates the permissions in the JSON file with the role
-
-```
-curl -i -v -H "Content-Type: application/json" -u internal -X POST -d@perm.json http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/roles/readRole/permissions
+[
+ { "resource": { "name": "wikipedia", "type": "DATASOURCE" }, "action": "READ" },
+ { "resource": { "name": ".*", "type": "STATE" }, "action": "READ" },
+ { "resource": {"name": ".*", "type": "CONFIG"}, "action": "READ"}
+]
```
-Note that the STATE and CONFIG permissions in `perm.json` are needed to see the data source in the web console. If only querying permissions are needed, the READ action is sufficient:
+The following request associates the permissions in the JSON file with the `readRole` role:
```
-[{ "resource": { "name": "wikipedia", "type": "DATASOURCE" }, "action": "READ" }]
+curl -i -v -H "Content-Type: application/json" -u internal -X POST -d@perm.json http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/roles/readRole/permissions
```
-You can also provide the name in the form of regular expression. For example, to give access to all data sources starting with `wiki`, specify the name as `{ "name": "wiki.*", .....`.
+Druid users need the `STATE` and `CONFIG` permissions to view the data source in the Druid console. If you only want to assign querying permissions, you can apply just the `READ` permission with the first line in the `perm.json` file.
+You can also provide the data source name in the form of a regular expression. For example, to give access to all data sources starting with `wiki`, specify the data source name as `{ "name": "wiki.*" }`, as in the sketch below.
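+
+A `perm.json` file granting read access to every data source whose name starts with `wiki` might look like this (illustrative only):
+
+```
+[
+  { "resource": { "name": "wiki.*", "type": "DATASOURCE" }, "action": "READ" }
+]
+```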
-### Step 3: Create group Mapping
+### Create the group mapping
-The following shows an example of a group to role mapping. It assumes that a group named `group1` exists in the directory. Also assuming the following role mapping in a file named `groupmap.json`:
+You can now map an LDAP group to the Druid role. The following example request creates a mapping with name `mygroupmap`. It assumes that a group named `mygroup` exists in the directory.
```
{
- "name": "group1map",
- "groupPattern": "CN=group1,CN=Users,DC=example,DC=com",
- "roles": [
- "readRole"
- ]
+ "name": "mygroupmap",
+ "groupPattern": "CN=mygroup,CN=Users,DC=example,DC=com",
+ "roles": [
+ "readRole"
+ ]
}
```
-You can configure the mapping as follows:
+The following example request configures the mapping. The role mapping is in the file `groupmap.json`. See [Configure Druid for LDAP authentication](#configure-druid-for-ldap-authentication) for the contents of an example file.
```
-curl -i -v -H "Content-Type: application/json" -u internal -X POST -d @groupmap.json http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/group1map
+curl -i -v -H "Content-Type: application/json" -u internal -X POST -d @groupmap.json http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/mygroupmap
```
-To check whether the group mapping was created successfully, run the following command:
+To check whether the group mapping was created successfully, the following request lists all group mappings:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings
+curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings
```
-To check the details of a specific group mapping, use the following:
+The following example request returns the details of the `mygroupmap` group:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/group1map
+curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/mygroupmap
```
-To add additional roles to the group mapping, use the following API:
+The following example request adds the role `queryRole` to the `mygroupmap` mapping:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/group1/roles/
+curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/mygroupmap/roles/queryRole
```
-In the next two steps you will be creating a user, and assigning previously created roles to it. These steps are only needed in the following cases:
-
- - Your LDAP server does not support the `memberOf` attribute, or
- - You want to configure a user with additional roles that are not mapped to the group(s) that the user is a member of
-
- If this is not the case for your scenario, you can skip these steps.
+### Add an LDAP user to Druid and assign a role
-### Step 4. Create a user
+You only need to complete this step if:
+- Your LDAP user doesn't belong to any of your LDAP groups, or
+- You want to configure a user with additional Druid roles that are not mapped to the LDAP groups that the user belongs to.
-Once LDAP is enabled, only user passwords are verified with LDAP. You add the LDAP user to Druid as follows:
+Example request to add the LDAP user `myuser` to Druid:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authentication/db/ldap/users/
+curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authentication/db/ldap/users/myuser
```
-### Step 5. Assign the role to the user
-
-The following command shows how to assign a role to a user:
+Example request to assign the `myuser` user to the `queryRole` role:
```
-curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/users//roles/
+curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/users/myuser/roles/queryRole
```
-For more information about security and the basic security extension, see [Security Overview](security-overview.md).
+## Enable LDAP over TLS (LDAPS)
+
+Once you've configured LDAP authentication in Druid, you can optionally make LDAP traffic confidential and secure by using Transport Layer Security (TLS), previously known as Secure Sockets Layer (SSL).
+
+Configuring LDAPS establishes trust between Druid and the LDAP server.
+
+## Prerequisites
+
+Before you start to set up LDAPS in Druid, you must [configure Druid for LDAP authentication](#configure-druid-for-ldap-authentication). You also need:
+
+- A certificate issued by a public certificate authority (CA) or a self-signed certificate by an internal CA.
+- The root certificate for the CA that signed the certificate for the LDAP server. If you're using a common public CA, the certificate may already be in the Java truststore. Otherwise you need to import the certificate for the CA.
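+
+To see which certificate your LDAP server presents on the LDAPS port before importing anything, you can run a quick check with `openssl` (a sketch assuming the default LDAPS port `636` and a placeholder `ip_address`):
+
+```bash
+# Print the certificate chain presented by the LDAP server.
+openssl s_client -connect ip_address:636 -showcerts </dev/null
+```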
+
+## Configure Druid for LDAPS
+
+Complete the following steps to set up LDAPS for Druid. See [Configuration reference](../configuration/index.md) for the location of the configuration files.
+
+1. Import the CA certificate for your LDAP server or a self-signed certificate into the truststore location saved as `druid.client.https.trustStorePath` in your `common.runtime.properties` file.
+
+ ```
+ keytool -import -trustcacerts -keystore path/to/cacerts -storepass truststorepassword -alias aliasName -file path/to/certificate.cer
+ ```
+
+ Replace `path/to/cacerts` with the path to your truststore, `truststorepassword` with your truststore password, `aliasName` with an alias name for the certificate entry, and `path/to/certificate.cer` with the location and name of your certificate. For example:
+
+ ```
+ keytool -import -trustcacerts -keystore /Library/Java/JavaVirtualMachines/adoptopenjdk-8.jdk/Contents/Home/jre/lib/security/cacerts -storepass mypassword -alias myAlias -file /etc/ssl/certs/my-certificate.cer
+ ```
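+
+   To confirm the import succeeded, you can list the new truststore entry, for example:
+
+   ```
+   keytool -list -keystore path/to/cacerts -storepass truststorepassword -alias aliasName
+   ```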
+
+2. If the root certificate for the CA isn't already in the Java truststore, import it:
+
+ ```
+ keytool -importcert -keystore path/to/cacerts -storepass truststorepassword -alias aliasName -file path/to/certificate.cer
+ ```
+
+ Replace `path/to/cacerts` with the path to your truststore, `truststorepassword` with your truststore password, `aliasName` with an alias name for the certificate entry, and `path/to/certificate.cer` with the location and name of your certificate. For example:
+
+ ```
+ keytool -importcert -keystore /Library/Java/JavaVirtualMachines/adoptopenjdk-8.jdk/Contents/Home/jre/lib/security/cacerts -storepass mypassword -alias myAlias -file /etc/ssl/certs/my-certificate.cer
+ ```
+
+3. In your `common.runtime.properties` file, add the following lines to the LDAP configuration section, substituting your own truststore path and password:
+
+ ```
+ druid.auth.basic.ssl.trustStorePath=/Library/Java/JavaVirtualMachines/adoptopenjdk-8.jdk/Contents/Home/jre/lib/security/cacerts
+ druid.auth.basic.ssl.protocol=TLS
+ druid.auth.basic.ssl.trustStorePassword=xxxxxx
+ ```
+
+ See [Druid basic security](../development/extensions-core/druid-basic-security.md#properties-for-ldaps) for details about these properties.
+
+4. You can optionally configure additional LDAPS properties in the `common.runtime.properties` file. See [Druid basic security](../development/extensions-core/druid-basic-security.md#properties-for-ldaps) for more information.
+
+5. Restart Druid.
+
+
+## Troubleshooting tips
+
+The following are some ideas to help you troubleshoot issues with LDAP and LDAPS.
+
+### Check the coordinator logs
+
+If your LDAP connection isn't working, check the coordinator logs. See [Logging](../configuration/logging.md) for details.
+
+### Check the Druid escalator configuration
+
+If the coordinator is working but the rest of the cluster isn't, check the escalator configuration. See the [Configuration reference](../configuration/index.md) for details. You can also check other service logs to see why the services are unable to fetch authorization details from the coordinator.
+
+### Check your LDAP server response time
+
+If a user can log in to the Druid console but the landing page shows a 401 error, check your LDAP server response time. In a large organization with a high number of LDAP users, LDAP may be slow to respond, and this can result in a connection timeout.
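+
+One way to gauge LDAP response time is to time a simple search from the Coordinator host (a sketch; note that `-w` passes the bind password on the command line, so prefer `-W` outside of quick tests):
+
+```bash
+# Time a single search; consistently slow responses point to LDAP latency.
+time ldapsearch -x -H ldap://ip_address:389 -D "myuser@example.com" -w 'mypassword' -b "dc=example,dc=com" "(sAMAccountName=myuser)" dn
+```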
diff --git a/docs/operations/metrics.md b/docs/operations/metrics.md
index 8822f3fea73d..4e3c961dcb8d 100644
--- a/docs/operations/metrics.md
+++ b/docs/operations/metrics.md
@@ -230,8 +230,14 @@ Note: If the JVM does not support CPU time measurement for the current thread, `
|------|-----------|------------------------------------------------------------|------------|
|`task/run/time`|Milliseconds taken to run a task.| `dataSource`, `taskId`, `taskType`, `taskStatus`|Varies|
|`task/pending/time`|Milliseconds taken for a task to wait for running.| `dataSource`, `taskId`, `taskType`|Varies|
-|`task/action/log/time`|Milliseconds taken to log a task action to the audit log.| `dataSource`, `taskId`, `taskType`|< 1000 (subsecond)|
-|`task/action/run/time`|Milliseconds taken to execute a task action.| `dataSource`, `taskId`, `taskType`|Varies from subsecond to a few seconds, based on action type.|
+|`task/action/log/time`|Milliseconds taken to log a task action to the audit log.| `dataSource`, `taskId`, `taskType`, `taskActionType`|< 1000 (subsecond)|
+|`task/action/run/time`|Milliseconds taken to execute a task action.| `dataSource`, `taskId`, `taskType`, `taskActionType`|Varies from subsecond to a few seconds, based on action type.|
+|`task/action/success/count`|Number of task actions that were executed successfully during the emission period. Currently only being emitted for [batched `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions).| `dataSource`, `taskId`, `taskType`, `taskActionType`|Varies|
+|`task/action/failed/count`|Number of task actions that failed during the emission period. Currently only being emitted for [batched `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions).| `dataSource`, `taskId`, `taskType`, `taskActionType`|Varies|
+|`task/action/batch/queueTime`|Milliseconds spent by a batch of task actions in queue. Currently only being emitted for [batched `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions).| `dataSource`, `taskActionType`, `interval`|Varies based on the `batchAllocationWaitTime` and number of batches in queue.|
+|`task/action/batch/runTime`|Milliseconds taken to execute a batch of task actions. Currently only being emitted for [batched `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions).| `dataSource`, `taskActionType`, `interval`|Varies from subsecond to a few seconds, based on action type and batch size.|
+|`task/action/batch/size`|Number of task actions in a batch that was executed during the emission period. Currently only being emitted for [batched `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions).| `dataSource`, `taskActionType`, `interval`|Varies based on number of concurrent task actions.|
+|`task/action/batch/attempts`|Number of execution attempts for a single batch of task actions. Currently only being emitted for [batched `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions).| `dataSource`, `taskActionType`, `interval`|1 if there are no failures or retries.|
|`segment/added/bytes`|Size in bytes of new segments created.| `dataSource`, `taskId`, `taskType`, `interval`|Varies|
|`segment/moved/bytes`|Size in bytes of segments moved/archived via the Move Task.| `dataSource`, `taskId`, `taskType`, `interval`|Varies|
|`segment/nuked/bytes`|Size in bytes of segments deleted via the Kill Task.| `dataSource`, `taskId`, `taskType`, `interval`|Varies|
diff --git a/docs/operations/python.md b/docs/operations/python.md
new file mode 100644
index 000000000000..9f5b9c34909e
--- /dev/null
+++ b/docs/operations/python.md
@@ -0,0 +1,49 @@
+---
+id: python
+title: "Python Installation"
+---
+
+
+
+The Apache Druid startup script requires a Python 2 or Python 3 interpreter.
+Since Python 2 is deprecated, this document provides instructions for installing a Python 3 interpreter.
+
+## Python 3 installation instructions
+
+### Linux
+
+#### Debian or Ubuntu
+ - `sudo apt update`
+ - `sudo apt install -y python3-pip`
+#### RHEL
+ - `sudo yum install -y epel-release`
+ - `sudo yum install -y python3-pip`
+
+### MacOS
+
+#### Install with Homebrew
+Refer to [Installing Python 3 on Mac OS X](https://docs.python-guide.org/starting/install3/osx/).
+
+#### Install the official Python release
+* Browse to the [Python Downloads Page](https://www.python.org/downloads/) and download the latest version (3.x.x).
+
+Verify that Python 3 is installed by running the `python3 --version` command.
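+
+For example (the reported version varies by system):
+
+```bash
+python3 --version
+# Example output: Python 3.9.6
+```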
+
+
diff --git a/docs/operations/security-overview.md b/docs/operations/security-overview.md
index 028cff04f55a..3fa80e24adc2 100644
--- a/docs/operations/security-overview.md
+++ b/docs/operations/security-overview.md
@@ -250,80 +250,7 @@ The following steps walk through a sample setup procedure:
## Configuring an LDAP authenticator
-As an alternative to using the basic metadata authenticator, you can use LDAP to authenticate users. The following steps provide an overview of the setup procedure. For more information on these settings, see [Properties for LDAP user authentication](../development/extensions-core/druid-basic-security.md#properties-for-ldap-user-authentication).
-
-1. In `common.runtime.properties`, add LDAP to the authenticator chain in the order in which you want requests to be evaluated. For example:
- ```
- # Druid basic security
- druid.auth.authenticatorChain=["ldap", "MyBasicMetadataAuthenticator"]
- ```
-
-2. Configure LDAP settings in `common.runtime.properties` as appropriate for your LDAP scheme and system. For example:
- ```
- druid.auth.authenticator.ldap.type=basic
- druid.auth.authenticator.ldap.enableCacheNotifications=true
- druid.auth.authenticator.ldap.credentialsValidator.type=ldap
- druid.auth.authenticator.ldap.credentialsValidator.url=ldap://ad_host:389
- druid.auth.authenticator.ldap.credentialsValidator.bindUser=ad_admin_user
- druid.auth.authenticator.ldap.credentialsValidator.bindPassword=ad_admin_password
- druid.auth.authenticator.ldap.credentialsValidator.baseDn=dc=example,dc=com
- druid.auth.authenticator.ldap.credentialsValidator.userSearch=(&(sAMAccountName=%s)(objectClass=user))
- druid.auth.authenticator.ldap.credentialsValidator.userAttribute=sAMAccountName
- druid.auth.authenticator.ldap.authorizerName=ldapauth
- druid.escalator.type=basic
- druid.escalator.internalClientUsername=ad_interal_user
- druid.escalator.internalClientPassword=Welcome123
- druid.escalator.authorizerName=ldapauth
- druid.auth.authorizers=["ldapauth"]
- druid.auth.authorizer.ldapauth.type=basic
- druid.auth.authorizer.ldapauth.initialAdminUser=
- druid.auth.authorizer.ldapauth.initialAdminRole=admin
- druid.auth.authorizer.ldapauth.roleProvider.type=ldap
- ```
-
-3. Use the Druid API to create the group mapping and allocate initial roles. For example, using curl and given a group named `group1` in the directory, run:
- ```
- curl -i -v -H "Content-Type: application/json" -u internal -X POST -d @groupmap.json http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/group1map
- ```
- The `groupmap.json` file contents would be something like:
- ```
- {
- "name": "group1map",
- "groupPattern": "CN=group1,CN=Users,DC=example,DC=com",
- "roles": [
- "readRole"
- ]
- }
- ```
-4. Check if the group mapping is created successfully by executing the following API. This lists all group mappings.
- ```
- curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings
- ```
-
- Alternatively, to check the details of a specific group mapping, use the following API:
- ```
- curl -i -v -H "Content-Type: application/json" -u internal -X GET http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/group1map
- ```
-
-5. To add additional roles to the group mapping, use the following API:
- ```
- curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/groupMappings/group1/roles/
- ```
-
-6. Add the LDAP user to Druid. To add a user, use the following authentication API:
- ```
- curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authentication/db/ldap/users/
- ```
-
-7. Use the following command to assign the role to a user:
- ```
- curl -i -v -H "Content-Type: application/json" -u internal -X POST http://localhost:8081/druid-ext/basic-security/authorization/db/ldapauth/users//roles/
- ```
-
-
-
-Congratulations, you have configured permissions for user-assigned roles in Druid!
-
+As an alternative to using the basic metadata authenticator, you can use LDAP to authenticate users. See [Configure LDAP authentication](./auth-ldap.md) for information on configuring Druid for LDAP and LDAPS.
## Druid security trust model
Within Druid's trust model, users can have different authorization levels:
diff --git a/docs/operations/single-server.md b/docs/operations/single-server.md
index 35413952e222..48459a286042 100644
--- a/docs/operations/single-server.md
+++ b/docs/operations/single-server.md
@@ -23,14 +23,17 @@ title: "Single server deployment"
-->
-Druid includes a set of reference configurations and launch scripts for single-machine deployments:
-
-- `nano-quickstart`
-- `micro-quickstart`
-- `small`
-- `medium`
-- `large`
-- `xlarge`
+Druid includes a set of reference configurations and launch scripts for single-machine deployments.
+These configuration bundles are located in `conf/druid/single-server/`.
+
+The `auto` configuration sizes runtime parameters based on available processors and memory. Other configurations include hard-coded runtime parameters for various server sizes. Most users should stick with `auto`. For details, see [Druid auto start](#druid-auto-start) below.
+- `auto` (run script: `bin/start-druid`)
+- `nano-quickstart` (run script: `bin/start-nano-quickstart`)
+- `micro-quickstart` (run script: `bin/start-micro-quickstart`)
+- `small` (run script: `bin/start-single-server-small`)
+- `medium` (run script: `bin/start-single-server-medium`)
+- `large` (run script: `bin/start-single-server-large`)
+- `xlarge` (run script: `bin/start-single-server-xlarge`)
The `micro-quickstart` is sized for small machines like laptops and is intended for quick evaluation use-cases.
@@ -44,6 +47,18 @@ The example configurations run the Druid Coordinator and Overlord together in a
While example configurations are provided for very large single machines, at higher scales we recommend running Druid in a [clustered deployment](../tutorials/cluster.md), for fault-tolerance and reduced resource contention.
+## Druid auto start
+
+Druid includes a launch script, `bin/start-druid`, that automatically sets various memory-related parameters based on available processors and memory.
+
+`start-druid` is a generic launch script capable of starting any set of Druid services on a server.
+It accepts optional arguments such as a list of services, total memory, and a config directory to override default JVM arguments and service-specific runtime properties.
+Druid services will use all processors and up to 80% of the memory on the system.
+For details about possible arguments, run `bin/start-druid --help`.
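+
+For example, the following commands start Druid with automatically sized settings and print the supported arguments (a minimal sketch; the exact options vary by Druid version):
+
+```bash
+# Start the default set of services with auto-configured parameters.
+bin/start-druid
+
+# List the optional arguments (services, total memory, config directory).
+bin/start-druid --help
+```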
+
+The size-specific launch scripts (for example, `start-micro-quickstart`) are now deprecated.
+
+
## Single server reference configurations
### Nano-Quickstart: 1 CPU, 4GiB RAM
@@ -74,5 +89,4 @@ While example configurations are provided for very large single machines, at hig
### X-Large: 64 CPU, 512GiB RAM (~i3.16xlarge)
- Launch command: `bin/start-xlarge`
-- Configuration directory: `conf/druid/single-server/xlarge`
-
+- Configuration directory: `conf/druid/single-server/xlarge`
\ No newline at end of file
diff --git a/docs/querying/lookups.md b/docs/querying/lookups.md
index 57b406afb199..860a3ed2e277 100644
--- a/docs/querying/lookups.md
+++ b/docs/querying/lookups.md
@@ -115,8 +115,8 @@ will not detect this automatically.
Dynamic Configuration
---------------------
-> Dynamic lookup configuration is an [experimental](../development/experimental.md) feature. Static
-> configuration is no longer supported.
+> Static configuration is no longer supported.
+
The following documents the behavior of the cluster-wide config which is accessible through the Coordinator.
The configuration is propagated through the concept of "tier" of servers.
A "tier" is defined as a group of services which should receive a set of lookups.
diff --git a/docs/querying/nested-columns.md b/docs/querying/nested-columns.md
index e8dc628c8fc5..77af91ddff89 100644
--- a/docs/querying/nested-columns.md
+++ b/docs/querying/nested-columns.md
@@ -23,17 +23,17 @@ sidebar_label: Nested columns
~ under the License.
-->
-> Nested columns is an experimental feature available starting in Apache Druid 24.0. Like most experimental features, functionality documented on this page is subject to change in future releases. However, the COMPLEX column type includes versioning to provide backward compatible support in future releases. We strongly encourage you to experiment with nested columns in your development environment to evaluate that they meet your use case. If so, you can use them in production scenarios. Review the release notes and this page to stay up to date with changes.
-
Apache Druid supports directly storing nested data structures in `COMPLEX<json>` columns. `COMPLEX<json>` columns store a copy of the structured data in JSON format and specialized internal columns and indexes for nested literal values—STRING, LONG, and DOUBLE types. An optimized [virtual column](./virtual-columns.md#nested-field-virtual-column) allows Druid to read and filter these values at speeds consistent with standard Druid LONG, DOUBLE, and STRING columns.
Druid [SQL JSON functions](./sql-json-functions.md) allow you to extract, transform, and create `COMPLEX` values in SQL queries, using the specialized virtual columns where appropriate. You can use the [JSON nested columns functions](../misc/math-expr.md#json-functions) in [native queries](./querying.md) using [expression virtual columns](./virtual-columns.md#expression-virtual-column), and in native ingestion with a [`transformSpec`](../ingestion/ingestion-spec.md#transformspec).
You can use the JSON functions in INSERT and REPLACE statements in SQL-based ingestion, or in a `transformSpec` in native ingestion as an alternative to using a [`flattenSpec`](../ingestion/data-formats.md#flattenspec) object to "flatten" nested data for ingestion.
+Druid supports directly ingesting nested data with the following formats: JSON, Parquet, Avro, and ORC.
+
## Example nested data
-The examples in this topic use the data in [`nested_example_data.json`](https://static.imply.io/data/nested_example_data.json). The file contains a simple facsimile of an order tracking and shipping table.
+The examples in this topic use the JSON data in [`nested_example_data.json`](https://static.imply.io/data/nested_example_data.json). The file contains a simple facsimile of an order tracking and shipping table.
When pretty-printed, a sample row in `nested_example_data` looks like this:
@@ -63,7 +63,7 @@ When pretty-printed, a sample row in `nested_example_data` looks like this:
## Native batch ingestion
-For native batch ingestion, you can use the [JSON nested columns functions](./sql-json-functions.md) to extract nested data as an alternative to using the [`flattenSpec`](../ingestion/data-formats.md#flattenspec) input format.
+For native batch ingestion, you can use the [SQL JSON functions](./sql-json-functions.md) to extract nested data as an alternative to using the [`flattenSpec`](../ingestion/data-formats.md#flattenspec) input format.
To configure a dimension as a nested data type, specify the `json` type for the dimension in the `dimensions` list in the `dimensionsSpec` property of your ingestion spec.
@@ -124,7 +124,7 @@ For example, the following ingestion spec instructs Druid to ingest `shipTo` and
### Transform data during batch ingestion
-You can use the [JSON nested columns functions](./sql-json-functions.md) to transform JSON data and reference the transformed data in your ingestion spec.
+You can use the [SQL JSON functions](./sql-json-functions.md) to transform nested data and reference the transformed data in your ingestion spec.
To do this, define the output name and expression in the `transforms` list in the `transformSpec` object of your ingestion spec.
@@ -192,7 +192,7 @@ For example, the following ingestion spec extracts `firstName`, `lastName` and `
## SQL-based ingestion
-To ingest nested data using multi-stage query architecture, specify `COMPLEX` as the value for `type` when you define the row signature—`shipTo` and `details` in the following example ingestion spec:
+To ingest nested data using SQL-based ingestion, specify `COMPLEX<json>` as the value for `type` when you define the row signature—`shipTo` and `details` in the following example ingestion spec:

@@ -297,7 +297,7 @@ The [Kafka tutorial](../tutorials/tutorial-kafka.md) guides you through the step
### Transform data during SQL-based ingestion
-You can use the [JSON nested columns functions](./sql-json-functions.md) to transform JSON data in your ingestion query.
+You can use the [SQL JSON functions](./sql-json-functions.md) to transform nested data in your ingestion query.
For example, the following ingestion query is the SQL-based version of the [previous batch example](#transform-data-during-batch-ingestion)—it extracts `firstName`, `lastName`, and `address` from `shipTo` and creates a composite JSON object containing `product`, `details`, and `department`.
@@ -326,7 +326,7 @@ PARTITIONED BY ALL
## Ingest a JSON string as COMPLEX
-If your source data uses a string representation of your JSON column, you can still ingest the data as `COMPLEX` as follows:
+If your source data contains serialized JSON strings, you can ingest the data as `COMPLEX` as follows:
- During native batch ingestion, call the `parse_json` function in a `transform` object in the `transformSpec`.
- During SQL-based ingestion, use the PARSE_JSON keyword within your SELECT statement to transform the string values to JSON.
- If you are concerned that your data may not contain valid JSON, you can use `try_parse_json` for native batch or `TRY_PARSE_JSON` for SQL-based ingestion. For cases where the column does not contain valid JSON, Druid inserts a null value. A quick way to verify this behavior is shown below.
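+
+As a quick way to verify that behavior, the following sketch posts a query to the Druid SQL HTTP endpoint. It assumes a quickstart deployment with the Router listening on `localhost:8888`; `TRY_PARSE_JSON` should return a parsed object for the valid literal and null for the invalid one.
+
+```bash
+# Write the query to a file to avoid shell-quoting issues.
+cat <<'EOF' > try_parse_json_query.json
+{"query": "SELECT TRY_PARSE_JSON('{\"x\": 1}') AS valid_json, TRY_PARSE_JSON('not json') AS invalid_json"}
+EOF
+
+# Post the query to the SQL endpoint.
+curl -X POST -H 'Content-Type: application/json' -d @try_parse_json_query.json http://localhost:8888/druid/v2/sql
+```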
@@ -563,7 +563,7 @@ In addition to `JSON_VALUE`, Druid offers a number of operators that focus on tr
- `PARSE_JSON`
- `TO_JSON_STRING`
-These functions are primarily intended for use with the multi-stage query architecture to transform data during insert operations, but they also work in traditional Druid SQL queries. Because most of these functions output JSON objects, they have the same limitations when used in traditional Druid queries as interacting with the JSON objects directly.
+These functions are primarily intended for use with SQL-based ingestion to transform data during insert operations, but they also work in traditional Druid SQL queries. Because most of these functions output JSON objects, they have the same limitations when used in traditional Druid queries as interacting with the JSON objects directly.
#### Example query: Return results in a JSON object
@@ -663,7 +663,7 @@ Before you start using the nested columns feature, consider the following known
- Directly using `COMPLEX` columns and expressions is not well integrated into the Druid query engine. It can result in errors or undefined behavior when grouping and filtering, and when you use `COMPLEX` objects as inputs to aggregators. As a workaround, consider using `TO_JSON_STRING` to coerce the values to strings before you perform these operations.
- Directly using array-typed outputs from `JSON_KEYS` and `JSON_PATHS` is moderately supported by the Druid query engine. You can group on these outputs, and there are a number of array expressions that can operate on these values, such as `ARRAY_CONCAT_AGG`. However, some operations are not well defined for use outside array-specific functions, such as filtering using `=` or `IS NULL`.
- Input validation for JSON SQL operators is currently incomplete, which sometimes results in undefined behavior or unhelpful error messages.
-- Ingesting JSON columns with a very complex nested structure is potentially an expensive operation and may require you to tune ingestion tasks and/or cluster parameters to account for increased memory usage or overall task run time. When you tune your ingestion configuration, treat each nested literal field inside a JSON object as a flattened top-level Druid column.
+- Ingesting data with a very complex nested structure is potentially an expensive operation and may require you to tune ingestion tasks and/or cluster parameters to account for increased memory usage or overall task run time. When you tune your ingestion configuration, treat each nested literal field inside an object as a flattened top-level Druid column.
## Further reading
diff --git a/docs/querying/sql-jdbc.md b/docs/querying/sql-jdbc.md
index 0f041c6fad38..a558637bc110 100644
--- a/docs/querying/sql-jdbc.md
+++ b/docs/querying/sql-jdbc.md
@@ -29,6 +29,12 @@ sidebar_label: "JDBC driver API"
You can make [Druid SQL](./sql.md) queries using the [Avatica JDBC driver](https://calcite.apache.org/avatica/downloads/). We recommend using Avatica JDBC driver version 1.17.0 or later. Note that as of the time of this writing, Avatica 1.17.0, the latest version, does not support passing connection string parameters from the URL to Druid, so you must pass them using a `Properties` object. Once you've downloaded the Avatica client jar, add it to your classpath and use the connect string `jdbc:avatica:remote:url=http://BROKER:8082/druid/v2/sql/avatica/`.
+When using the JDBC connector for the [examples](#examples) or in general, it's helpful to understand the parts of the connect string stored in the `url` variable:
+
+ - `jdbc:avatica:remote:url=` is prepended to the hostname and port.
+ - The hostname and port number for your Druid deployment depend on whether you want to connect to the Router or a specific Broker. For more information, see [Connection stickiness](#connection-stickiness). In the case of the quickstart deployment, the hostname and port are `http://localhost:8888`, which connects to the Router running on your local machine.
+ - The SQL endpoint in Druid for the Avatica driver is `/druid/v2/sql/avatica/`.
+
Example code:
```java
@@ -51,6 +57,8 @@ try (Connection connection = DriverManager.getConnection(url, connectionProperti
}
```
+For a runnable example, including a query you might run, see [Examples](#examples).
+
It is also possible to use a protocol buffers JDBC connection with Druid, which offers reduced overhead and potential performance
improvements for larger result sets. To use it, apply the following connection URL instead; everything else remains the same:
```
@@ -60,12 +68,12 @@ String url = "jdbc:avatica:remote:url=http://localhost:8082/druid/v2/sql/avatica
> The protobuf endpoint is also known to work with the official [Golang Avatica driver](https://github.com/apache/calcite-avatica-go)
Table metadata is available over JDBC using `connection.getMetaData()` or by querying the
-["INFORMATION_SCHEMA" tables](sql-metadata-tables.md).
+["INFORMATION_SCHEMA" tables](sql-metadata-tables.md). For an example of this, see [Get the metadata for a datasource](#get-the-metadata-for-a-datasource).
## Connection stickiness
Druid's JDBC server does not share connection state between Brokers. This means that if you're using JDBC and have
-multiple Druid Brokers, you should either connect to a specific Broker, or use a load balancer with sticky sessions
+multiple Druid Brokers, you should either connect to a specific Broker or use a load balancer with sticky sessions
enabled. The Druid Router process provides connection stickiness when balancing JDBC requests, and can be used to achieve
the necessary stickiness even with a normal non-sticky load balancer. Please see the
[Router](../design/router.md) documentation for more details.
@@ -82,3 +90,112 @@ statement.setString(1, "abc");
statement.setString(2, "def");
final ResultSet resultSet = statement.executeQuery();
```
+
+## Examples
+
+The following section contains two complete samples that use the JDBC connector:
+
+- [Get the metadata for a datasource](#get-the-metadata-for-a-datasource) shows you how to query the `INFORMATION_SCHEMA` to get metadata like column names.
+- [Query data](#query-data) runs a select query against the datasource.
+
+You can try out these examples after verifying that you meet the [prerequisites](#prerequisites).
+
+For more information about the connection options, see [Client Reference](https://calcite.apache.org/avatica/docs/client_reference.html).
+
+### Prerequisites
+
+Make sure you meet the following requirements before trying these examples:
+
+- A supported Java version, such as Java 8
+
+- [Avatica JDBC driver](https://calcite.apache.org/avatica/downloads/). You can add the JAR to your `CLASSPATH` directly or manage it externally, such as through Maven and a `pom.xml` file.
+
+- An available Druid instance. You can use the `micro-quickstart` configuration described in [Quickstart (local)](../tutorials/index.md). The examples assume that you are using the quickstart, so no authentication or authorization is expected unless explicitly mentioned.
+
+- The example `wikipedia` datasource from the quickstart is loaded on your Druid instance. If you have a different datasource loaded, you can still try these examples. You'll have to update the table name and column names to match your datasource.
+
+### Get the metadata for a datasource
+
+Metadata, such as column names, is available either through the [`INFORMATION_SCHEMA`](../querying/sql-metadata-tables.md) table or through `connection.getMetaData()`. The following example uses the `INFORMATION_SCHEMA` table to retrieve and print the list of column names for the `wikipedia` datasource that you loaded during a previous tutorial.
+
+```java
+import java.sql.*;
+import java.util.Properties;
+
+public class JdbcListColumns {
+
+ public static void main(String args[]) throws SQLException
+ {
+ // Connect to /druid/v2/sql/avatica/ on your Router.
+ // You can connect to a Broker but must configure connection stickiness if you do.
+ String url = "jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica/";
+
+ String query = "SELECT COLUMN_NAME,* FROM INFORMATION_SCHEMA.COLUMNS WHERE TABLE_NAME = 'wikipedia' and TABLE_SCHEMA='druid'";
+ // Set any connection context parameters you need here
+ // Or leave empty for default behavior.
+ Properties connectionProperties = new Properties();
+
+ try (Connection connection = DriverManager.getConnection(url, connectionProperties)) {
+ try (
+ final Statement statement = connection.createStatement();
+ final ResultSet rs = statement.executeQuery(query)
+ ) {
+ while (rs.next()) {
+ String columnName = rs.getString("COLUMN_NAME");
+ System.out.println(columnName);
+ }
+ }
+ } catch (SQLException e) {
+ throw new RuntimeException(e);
+ }
+
+ }
+}
+```
+
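+If you manage the Avatica driver JAR manually rather than through Maven, compiling and running the example might look like the following sketch. The JAR file name here is illustrative, based on the driver version recommended above; adjust it to match your download.
+
+```bash
+# Compile and run against the Avatica client jar (file name is an assumption).
+javac -cp "avatica-1.17.0.jar" JdbcListColumns.java
+java -cp "avatica-1.17.0.jar:." JdbcListColumns
+```
+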
+### Query data
+
+Now that you know what columns are available, you can start querying the data. The following example queries the datasource named `wikipedia` for the timestamps and comments from Japan. It also sets the [query context parameter](../querying/sql-query-context.md) `sqlTimeZone`. You can also parameterize queries by using [dynamic parameters](#dynamic-parameters).
+
+```java
+import java.sql.*;
+import java.util.Properties;
+
+public class JdbcCountryAndTime {
+
+ public static void main(String args[]) throws SQLException
+ {
+ // Connect to /druid/v2/sql/avatica/ on your Router.
+ // You can connect to a Broker but must configure connection stickiness if you do.
+ String url = "jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica/";
+
+ //The query you want to run.
+ String query = "SELECT __time, isRobot, countryName, comment FROM wikipedia WHERE countryName='Japan'";
+ // Set any connection context parameters you need here
+ // Or leave empty for default behavior.
+ Properties connectionProperties = new Properties();
+ connectionProperties.setProperty("sqlTimeZone", "America/Los_Angeles");
+
+ try (Connection connection = DriverManager.getConnection(url, connectionProperties)) {
+ try (
+ final Statement statement = connection.createStatement();
+ final ResultSet rs = statement.executeQuery(query)
+ ) {
+ while (rs.next()) {
+ Timestamp timeStamp = rs.getTimestamp("__time");
+ String comment = rs.getString("comment");
+ System.out.println(timeStamp);
+ System.out.println(comment);
+ }
+ }
+ } catch (SQLException e) {
+ throw new RuntimeException(e);
+ }
+
+ }
+}
+```
+
+
diff --git a/docs/querying/sql-translation.md b/docs/querying/sql-translation.md
index d26ae6f0d276..370ad002c1cd 100644
--- a/docs/querying/sql-translation.md
+++ b/docs/querying/sql-translation.md
@@ -24,7 +24,7 @@ sidebar_label: "SQL query translation"
-->
> Apache Druid supports two query languages: Druid SQL and [native queries](querying.md).
-> This document describes the SQL language.
+> This document describes the Druid SQL language.
Druid uses [Apache Calcite](https://calcite.apache.org/) to parse and plan SQL queries.
Druid translates SQL statements into its [native JSON-based query language](querying.md).
@@ -34,8 +34,8 @@ This topic includes best practices and tools to help you achieve good performanc
## Best practices
-Consider this (non-exhaustive) list of things to look out for when looking into the performance implications of
-how your SQL queries are translated to native queries.
+Consider the following non-exhaustive list of best practices when looking into performance implications of
+translating Druid SQL queries to native queries.
1. If you wrote a filter on the primary time column `__time`, make sure it is being correctly translated to an
`"intervals"` filter, as described in the [Time filters](#time-filters) section below. If not, you may need to change
@@ -241,10 +241,9 @@ enabling logging and running this query, we can see that it actually runs as the
Druid SQL uses four different native query types.
-- [Scan](scan-query.md) is used for queries that do not aggregate (no GROUP BY, no DISTINCT).
+- [Scan](scan-query.md) is used for queries that do not aggregate—no GROUP BY, no DISTINCT.
-- [Timeseries](timeseriesquery.md) is used for queries that GROUP BY `FLOOR(__time TO unit)` or `TIME_FLOOR(__time,
-period)`, have no other grouping expressions, no HAVING or LIMIT clauses, no nesting, and either no ORDER BY, or an
+- [Timeseries](timeseriesquery.md) is used for queries that GROUP BY `FLOOR(__time TO unit)` or `TIME_FLOOR(__time, period)`, have no other grouping expressions, no HAVING clause, no nesting, and either no ORDER BY, or an
ORDER BY that orders by the same expression as present in GROUP BY. It also uses Timeseries for "grand total" queries that
have aggregation functions but no GROUP BY. This query type takes advantage of the fact that Druid segments are sorted
by time.
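+
+One way to check which native query type a SQL statement translates to is to prefix it with `EXPLAIN PLAN FOR`. The following sketch assumes a quickstart deployment with the Router on `localhost:8888` and the quickstart `wikipedia` datasource loaded; a query that groups only on `FLOOR(__time TO HOUR)` should plan as a Timeseries query.
+
+```bash
+# EXPLAIN PLAN FOR returns the native query plan instead of query results.
+cat <<'EOF' > explain_query.json
+{"query": "EXPLAIN PLAN FOR SELECT FLOOR(__time TO HOUR) AS t, COUNT(*) FROM wikipedia GROUP BY 1"}
+EOF
+
+curl -X POST -H 'Content-Type: application/json' -d @explain_query.json http://localhost:8888/druid/v2/sql
+```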
diff --git a/docs/tutorials/cluster.md b/docs/tutorials/cluster.md
index b61953c2f427..5ee68e2cd13e 100644
--- a/docs/tutorials/cluster.md
+++ b/docs/tutorials/cluster.md
@@ -130,7 +130,10 @@ The [basic cluster tuning guide](../operations/basic-cluster-tuning.md) has info
## Select OS
-We recommend running your favorite Linux distribution. You will also need [Java 8 or 11](../operations/java.md).
+We recommend running your favorite Linux distribution. You will also need:
+
+* [Java 8 or 11](../operations/java.md)
+* [Python 2 or Python 3](../operations/python.md)
> If needed, you can specify where to find Java using the environment variables
> `DRUID_JAVA_HOME` or `JAVA_HOME`. For more details run the `bin/verify-java` script.
diff --git a/docs/tutorials/index.md b/docs/tutorials/index.md
index 7d3d2ab68ec1..d854a691e6b9 100644
--- a/docs/tutorials/index.md
+++ b/docs/tutorials/index.md
@@ -22,8 +22,7 @@ title: "Quickstart (local)"
~ under the License.
-->
-
-This quickstart gets you started with Apache Druid using the [`micro-quickstart`](../operations/single-server.md#micro-quickstart-4-cpu-16gib-ram) configuration, and introduces you to Druid ingestion and query features.
+This quickstart gets you started with Apache Druid and introduces you to Druid ingestion and query features. For this tutorial, we recommend a machine with at least 6 GB of RAM.
In this quickstart, you'll do the following:
- install Druid
@@ -37,15 +36,16 @@ Druid supports a variety of ingestion options. Once you're done with this tutori
You can follow these steps on a relatively modest machine, such as a workstation or virtual server with 16 GiB of RAM.
-Druid comes equipped with several [startup configuration profiles](../operations/single-server.md) for a
-range of machine sizes. These range from `nano` (1 CPU, 4GiB RAM) to `x-large` (64 CPU, 512GiB RAM). For more
-information, see [Single server deployment](../operations/single-server.md). For information on deploying Druid services
-across clustered machines, see [Clustered deployment](./cluster.md).
+Druid comes equipped with launch scripts that can be used to start all processes on a single server. Here, we will use [`auto`](../operations/single-server.md#druid-auto-start), which automatically sets various runtime properties based on available processors and memory.
+
+In addition, Druid includes several [bundled non-automatic profiles](../operations/single-server.md) for a range of machine sizes. These range from `nano` (1 CPU, 4GiB RAM) to `x-large` (64 CPU, 512GiB RAM).
+We won't use those here, but for more information, see [Single server deployment](../operations/single-server.md). For additional information on deploying Druid services across clustered machines, see [Clustered deployment](./cluster.md).
The software requirements for the installation machine are:
* Linux, Mac OS X, or other Unix-like OS. (Windows is not supported.)
* Java 8u92+ or Java 11.
+* [Python 2 or Python 3](../operations/python.md).
> Druid relies on the environment variables `JAVA_HOME` or `DRUID_JAVA_HOME` to find Java on the machine. You can set
`DRUID_JAVA_HOME` if there is more than one instance of Java. To verify Java requirements for your environment, run the
@@ -72,30 +72,31 @@ The distribution directory contains `LICENSE` and `NOTICE` files and subdirector
## Start up Druid services
-Start up Druid services using the `micro-quickstart` single-machine configuration.
+Start up Druid services using the `auto` single-machine configuration.
This configuration includes default settings that are appropriate for this tutorial, such as loading the `druid-multi-stage-query` extension by default so that you can use the MSQ task engine.
-You can view that setting and others in the configuration files in the `conf/druid/single-server/micro-quickstart/`.
+You can view that setting and others in the configuration files in the `conf/druid/auto` directory.
From the apache-druid-{{DRUIDVERSION}} package root, run the following command:
```bash
-./bin/start-micro-quickstart
+./bin/start-druid
```
This brings up instances of ZooKeeper and the Druid services:
```bash
-$ ./bin/start-micro-quickstart
-[Thu Sep 8 18:30:00 2022] Starting Apache Druid.
-[Thu Sep 8 18:30:00 2022] Open http://localhost:8888/ in your browser to access the web console.
-[Thu Sep 8 18:30:00 2022] Or, if you have enabled TLS, use https on port 9088.
-[Thu Sep 8 18:30:00 2022] Running command[zk], logging to[/apache-druid-{{DRUIDVERSION}}/var/sv/zk.log]: bin/run-zk conf
-[Thu Sep 8 18:30:00 2022] Running command[coordinator-overlord], logging to[/apache-druid-{{DRUIDVERSION}}/var/sv/coordinator-overlord.log]: bin/run-druid coordinator-overlord conf/druid/single-server/micro-quickstart
-[Thu Sep 8 18:30:00 2022] Running command[broker], logging to[/apache-druid-{{DRUIDVERSION}}/var/sv/broker.log]: bin/run-druid broker conf/druid/single-server/micro-quickstart
-[Thu Sep 8 18:30:00 2022] Running command[router], logging to[/apache-druid-{{DRUIDVERSION}}/var/sv/router.log]: bin/run-druid router conf/druid/single-server/micro-quickstart
-[Thu Sep 8 18:30:00 2022] Running command[historical], logging to[/apache-druid-{{DRUIDVERSION}}/var/sv/historical.log]: bin/run-druid historical conf/druid/single-server/micro-quickstart
-[Thu Sep 8 18:30:00 2022] Running command[middleManager], logging to[/apache-druid-{{DRUIDVERSION}}/var/sv/middleManager.log]: bin/run-druid middleManager conf/druid/single-server/micro-quickstart
+$ ./bin/start-druid
+[Tue Nov 29 16:31:06 2022] Starting Apache Druid.
+[Tue Nov 29 16:31:06 2022] Open http://localhost:8888/ in your browser to access the web console.
+[Tue Nov 29 16:31:06 2022] Or, if you have enabled TLS, use https on port 9088.
+[Tue Nov 29 16:31:06 2022] Starting services with log directory [/apache-druid-{{DRUIDVERSION}}/log].
+[Tue Nov 29 16:31:06 2022] Running command[zk]: bin/run-zk conf
+[Tue Nov 29 16:31:06 2022] Running command[broker]: bin/run-druid broker /apache-druid-{{DRUIDVERSION}}/conf/druid/single-server/quickstart '-Xms1187m -Xmx1187m -XX:MaxDirectMemorySize=791m'
+[Tue Nov 29 16:31:06 2022] Running command[router]: bin/run-druid router /apache-druid-{{DRUIDVERSION}}/conf/druid/single-server/quickstart '-Xms128m -Xmx128m'
+[Tue Nov 29 16:31:06 2022] Running command[coordinator-overlord]: bin/run-druid coordinator-overlord /apache-druid-{{DRUIDVERSION}}/conf/druid/single-server/quickstart '-Xms1290m -Xmx1290m'
+[Tue Nov 29 16:31:06 2022] Running command[historical]: bin/run-druid historical /apache-druid-{{DRUIDVERSION}}/conf/druid/single-server/quickstart '-Xms1376m -Xmx1376m -XX:MaxDirectMemorySize=2064m'
+[Tue Nov 29 16:31:06 2022] Running command[middleManager]: bin/run-druid middleManager /apache-druid-{{DRUIDVERSION}}/conf/druid/single-server/quickstart '-Xms64m -Xmx64m' '-Ddruid.worker.capacity=2 -Ddruid.indexer.runner.javaOptsArray=["-server","-Duser.timezone=UTC","-Dfile.encoding=UTF-8","-XX:+ExitOnOutOfMemoryError","-Djava.util.logging.manager=org.apache.logging.log4j.jul.LogManager","-Xms256m","-Xmx256m","-XX:MaxDirectMemorySize=256m"]'
```
All persistent state, such as the cluster metadata store and segments for the services, are kept in the `var` directory under
@@ -103,7 +104,7 @@ the Druid root directory, apache-druid-{{DRUIDVERSION}}. Each service writes to
At any time, you can revert Druid to its original, post-installation state by deleting the entire `var` directory. You may want to do this, for example, between Druid tutorials or after experimentation, to start with a fresh instance.
-To stop Druid at any time, use CTRL+C in the terminal. This exits the `bin/start-micro-quickstart` script and terminates all Druid processes.
+To stop Druid at any time, use CTRL+C in the terminal. This exits the `bin/start-druid` script and terminates all Druid processes.
## Open the web console
@@ -222,4 +223,4 @@ See the following topics for more information:
* [Tutorial: Load stream data from Apache Kafka](./tutorial-kafka.md) to load streaming data from a Kafka topic.
* [Extensions](../development/extensions.md) for details on Druid extensions.
-Remember that after stopping Druid services, you can start clean next time by deleting the `var` directory from the Druid root directory and running the `bin/start-micro-quickstart` script again. You may want to do this before using other data ingestion tutorials, since they use the same Wikipedia datasource.
+Remember that after stopping Druid services, you can start clean next time by deleting the `var` directory from the Druid root directory and running the `bin/start-druid` script again. You may want to do this before using other data ingestion tutorials, since they use the same Wikipedia datasource.
diff --git a/docs/tutorials/tutorial-batch-hadoop.md b/docs/tutorials/tutorial-batch-hadoop.md
index 47cd2d6bcbe5..234e8426b064 100644
--- a/docs/tutorials/tutorial-batch-hadoop.md
+++ b/docs/tutorials/tutorial-batch-hadoop.md
@@ -28,7 +28,7 @@ This tutorial shows you how to load data files into Apache Druid using a remote
For this tutorial, we'll assume that you've already completed the previous
[batch ingestion tutorial](tutorial-batch.md) using Druid's native batch ingestion system and are using the
-`micro-quickstart` single-machine configuration as described in the [quickstart](index.md).
+`auto` single-machine configuration as described in the [quickstart](../operations/single-server.md#druid-auto-start).
## Install Docker
@@ -156,7 +156,7 @@ cp /tmp/shared/hadoop_xml/*.xml {PATH_TO_DRUID}/conf/druid/single-server/micro-q
### Update Druid segment and log storage
-In your favorite text editor, open `conf/druid/single-server/micro-quickstart/_common/common.runtime.properties`, and make the following edits:
+In your favorite text editor, open `conf/druid/auto/_common/common.runtime.properties`, and make the following edits:
#### Disable local deep storage and enable HDFS deep storage
@@ -196,7 +196,7 @@ druid.indexer.logs.directory=/druid/indexing-logs
Once the Hadoop .xml files have been copied to the Druid cluster and the segment/log storage configuration has been updated to use HDFS, the Druid cluster needs to be restarted for the new configurations to take effect.
-If the cluster is still running, CTRL-C to terminate the `bin/start-micro-quickstart` script, and re-run it to bring the Druid services back up.
+If the cluster is still running, CTRL-C to terminate the `bin/start-druid` script, and re-run it to bring the Druid services back up.
## Load batch data
@@ -221,7 +221,7 @@ This tutorial is only meant to be used together with the [query tutorial](../tut
If you wish to go through any of the other tutorials, you will need to:
* Shut down the cluster and reset the cluster state by removing the contents of the `var` directory under the druid package.
-* Revert the deep storage and task storage config back to local types in `conf/druid/single-server/micro-quickstart/_common/common.runtime.properties`
+* Revert the deep storage and task storage config back to local types in `conf/druid/auto/_common/common.runtime.properties`
* Restart the cluster
This is necessary because the other ingestion tutorials will write to the same "wikipedia" datasource, and later tutorials expect the cluster to use local deep storage.
diff --git a/docs/tutorials/tutorial-jdbc.md b/docs/tutorials/tutorial-jdbc.md
new file mode 100644
index 000000000000..28cee144c3b0
--- /dev/null
+++ b/docs/tutorials/tutorial-jdbc.md
@@ -0,0 +1,31 @@
+---
+id: tutorial-jdbc
+title: "Tutorial: Using the JDBC driver to query Druid"
+sidebar_label: JDBC connector
+---
+
+
+
+Redirecting you to the JDBC connector examples...
+
+Click here if you are not redirected.
+
diff --git a/docs/tutorials/tutorial-kafka.md b/docs/tutorials/tutorial-kafka.md
index eb06f4239f95..0a47d3237fa6 100644
--- a/docs/tutorials/tutorial-kafka.md
+++ b/docs/tutorials/tutorial-kafka.md
@@ -30,7 +30,7 @@ The tutorial guides you through the steps to load sample nested clickstream data
## Prerequisites
-Before you follow the steps in this tutorial, download Druid as described in the [quickstart](index.md) using the [micro-quickstart](../operations/single-server.md#micro-quickstart-4-cpu-16gib-ram) single-machine configuration and have it running on your local machine. You don't need to have loaded any data.
+Before you follow the steps in this tutorial, download Druid as described in the [quickstart](index.md) using the [auto](../operations/single-server.md#druid-auto-start) single-machine configuration and have it running on your local machine. You don't need to have loaded any data.
## Download and start Kafka
diff --git a/examples/bin/run-druid b/examples/bin/run-druid
index c302672209a0..4be0afc5854b 100755
--- a/examples/bin/run-druid
+++ b/examples/bin/run-druid
@@ -17,7 +17,7 @@
# specific language governing permissions and limitations
# under the License.
-if [ "$#" -gt 2 ] || [ "$#" -eq 0 ]
+if [ "$#" -gt 4 ] || [ "$#" -eq 0 ]
then
>&2 echo "usage: $0 <service> [conf-dir]"
exit 1
@@ -47,7 +47,45 @@ if [ ! -d "$LOG_DIR" ]; then mkdir -p $LOG_DIR; fi
echo "Running [$1], logging to [$LOG_DIR/$1.log] if no changes made to log4j2.xml"
+if [ "$WHATAMI" = 'coordinator-overlord' ]
+then
+ SERVER_NAME=coordinator
+else
+ SERVER_NAME="$WHATAMI"
+fi
+
+
+if [ ! -f "$CONFDIR"/$WHATAMI/main.config ];
+ then
+ MAIN_CLASS="org.apache.druid.cli.Main server $SERVER_NAME"
+ else
+ MAIN_CLASS=`cat "$CONFDIR"/$WHATAMI/main.config | xargs`
+fi
+
cd "$WHEREAMI/.."
-exec "$WHEREAMI"/run-java -Ddruid.node.type=$1 "-Ddruid.log.path=$LOG_DIR" `cat "$CONFDIR"/"$WHATAMI"/jvm.config | xargs` \
- -cp "$CONFDIR"/"$WHATAMI":"$CONFDIR"/_common:"$CONFDIR"/_common/hadoop-xml:"$CONFDIR"/../_common:"$CONFDIR"/../_common/hadoop-xml:"$WHEREAMI/../lib/*" \
- `cat "$CONFDIR"/$WHATAMI/main.config | xargs`
+
+CLASS_PATH="$CONFDIR"/"$WHATAMI":"$CONFDIR"/_common:"$CONFDIR"/_common/hadoop-xml:"$CONFDIR"/../_common:"$CONFDIR"/../_common/hadoop-xml:"$WHEREAMI/../lib/*"
+
+if [ "$#" -eq 3 ] || [ "$#" -eq 4 ]
+then
+ # args: <service> <conf-dir> <jvm-args> or <service> <conf-dir> <jvm-args> <properties>
+ JVMARGS=`cat "$CONFDIR/_common/common.jvm.config" | xargs`
+ JVMARGS+=' '
+ JVMARGS+=$3
+
+ if [ "$#" -eq 3 ]
+ then
+ # args: <service> <conf-dir> <jvm-args>
+ exec "$WHEREAMI"/run-java -Ddruid.node.type=$1 "-Ddruid.log.path=$LOG_DIR" $JVMARGS \
+ -cp $CLASS_PATH $MAIN_CLASS
+ else
+ # args: <service> <conf-dir> <jvm-args> <properties>
+ exec "$WHEREAMI"/run-java -Ddruid.node.type=$1 $4 "-Ddruid.log.path=$LOG_DIR" $JVMARGS \
+ -cp $CLASS_PATH $MAIN_CLASS
+ fi
+else
+ # args: <service> [conf-dir]
+ exec "$WHEREAMI"/run-java -Ddruid.node.type=$1 "-Ddruid.log.path=$LOG_DIR" \
+ `cat "$CONFDIR"/"$WHATAMI"/jvm.config | xargs` \
+ -cp $CLASS_PATH $MAIN_CLASS
+fi
diff --git a/examples/bin/start-druid b/examples/bin/start-druid
new file mode 100755
index 000000000000..81d8938adbb2
--- /dev/null
+++ b/examples/bin/start-druid
@@ -0,0 +1,35 @@
+#!/bin/bash -eu
+
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+PWD="$(pwd)"
+WHEREAMI="$(dirname "$0")"
+WHEREAMI="$(cd "$WHEREAMI" && pwd)"
+
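+# Prefer python3, then python2, then an unversioned python interpreter.
+# The actual work happens in start-druid-main.py, which computes per-service
+# memory settings and execs the supervise script.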
+if [ -x "$(command -v python3)" ]
+then
+ exec python3 "$WHEREAMI/start-druid-main.py" "$@"
+elif [ -x "$(command -v python2)" ]
+then
+ exec python2 "$WHEREAMI/start-druid-main.py" "$@"
+elif [ -x "$(command -v python)" ]
+then
+ exec python "$WHEREAMI/start-druid-main.py" "$@"
+else
+ echo "python interepreter not found"
+fi
diff --git a/examples/bin/start-druid-main.py b/examples/bin/start-druid-main.py
new file mode 100644
index 000000000000..d1f4e6114918
--- /dev/null
+++ b/examples/bin/start-druid-main.py
@@ -0,0 +1,641 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+import sys
+import os
+import multiprocessing
+import argparse
+import subprocess
+import platform
+
+BASE_CONFIG_PATH = "conf/druid/auto"
+
+MEM_GB_SUFFIX = "g"
+MEM_MB_SUFFIX = "m"
+XMX_PARAMETER = "-Xmx"
+XMS_PARAMETER = "-Xms"
+DIRECT_MEM_PARAMETER = "-XX:MaxDirectMemorySize"
+SERVICE_SEPARATOR = ","
+
+TASK_JAVA_OPTS_ARRAY = ["-server", "-Duser.timezone=UTC", "-Dfile.encoding=UTF-8", "-XX:+ExitOnOutOfMemoryError",
+ "-Djava.util.logging.manager=org.apache.logging.log4j.jul.LogManager"]
+TASK_JAVA_OPTS_PROPERTY = "druid.indexer.runner.javaOptsArray"
+TASK_WORKER_CAPACITY_PROPERTY = "druid.worker.capacity"
+TASK_COUNT = "task-count"
+TASK_MEM_TYPE_LOW = "low"
+TASK_MEM_TYPE_HIGH = "high"
+TASK_MEM_MAP = {
+ TASK_MEM_TYPE_LOW: ["-Xms256m", "-Xmx256m", "-XX:MaxDirectMemorySize=256m"],
+ TASK_MEM_TYPE_HIGH: ["-Xms1g", "-Xmx1g", "-XX:MaxDirectMemorySize=1g"]
+}
+
+BROKER = "broker"
+ROUTER = "router"
+COORDINATOR = "coordinator-overlord"
+HISTORICAL = "historical"
+MIDDLE_MANAGER = "middleManager"
+TASKS = "tasks"
+INDEXER = "indexer"
+
+DEFAULT_SERVICES = [
+ BROKER,
+ ROUTER,
+ COORDINATOR,
+ HISTORICAL,
+ MIDDLE_MANAGER
+]
+
+SUPPORTED_SERVICES = [
+ BROKER,
+ ROUTER,
+ COORDINATOR,
+ HISTORICAL,
+ MIDDLE_MANAGER,
+ INDEXER
+]
+
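+# Relative weights used to split the total memory budget across the selected
+# services (and their tasks, if any); see distribute_memory() below.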
+SERVICE_MEMORY_RATIO = {
+ MIDDLE_MANAGER: 1,
+ ROUTER: 2,
+ COORDINATOR: 30,
+ BROKER: 46,
+ HISTORICAL: 80,
+ TASKS: 30,
+ INDEXER: 32
+}
+
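+# Per-service lower bounds, in MB; a service is never allocated less than this.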
+MINIMUM_MEMORY_MB = {
+ MIDDLE_MANAGER: 64,
+ ROUTER: 128,
+ TASKS: 1024,
+ BROKER: 900,
+ COORDINATOR: 256,
+ HISTORICAL: 900,
+ INDEXER: 1124
+}
+
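+# Fraction of each service's allocation that goes to the JVM heap (-Xms/-Xmx);
+# the remainder is assigned to direct memory where applicable.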
+HEAP_TO_TOTAL_MEM_RATIO = {
+ MIDDLE_MANAGER: 1,
+ ROUTER: 1,
+ COORDINATOR: 1,
+ BROKER: 0.60,
+ HISTORICAL: 0.40,
+ TASKS: 0.50,
+ INDEXER: 0.50
+}
+
+LOGGING_ENABLED = False
+
+
+def print_if_verbose(message):
+ if LOGGING_ENABLED:
+ print(message)
+
+
+def configure_parser():
+ parser = argparse.ArgumentParser(
+ prog='start-druid',
+ formatter_class=argparse.RawTextHelpFormatter,
+ epilog=
+ """
+sample usage:
+ start-druid
+ Start up all the services (including zk).
+ start-druid -m=100g
+ Start up all the services (including zk)
+ using a total memory of 100GB.
+ start-druid -m=100g --compute
+ Compute memory distribution and validate arguments.
+ start-druid -m=100g -s=broker,router
+ Starts a broker and a router, using a total memory of 100GB.
+ start-druid -m=100g --s=broker,router \\
+ -c=conf/druid/single-server/custom
+ Starts a broker and a router, using a total memory of 100GB.
+ Reads configs for each service (jvm.config, runtime.properties)
+ from respective folders inside the given root config path.
+ start-druid -s=broker,router \\
+ -c=conf/druid/single-server/custom
+ Starts a broker and a router service, reading service configs
+ from the given root directory. Calculates memory requirements for
+ each service, if required, using up to 80% of the total system memory.
+ start-druid -m=100g \\
+ -s=broker,router \\
+ -c=conf/druid/single-server/custom \\
+ --zk
+ Starts broker, router and zookeeper.
+ zookeeper config is read from conf/zk.
+"""
+ )
+ parser.add_argument('--memory', '-m', type=str, required=False,
+ help='Total memory for all processes (services and tasks, if any). \n'
+ 'This parameter is ignored if each service already has a jvm.config \n'
+ 'in the given conf directory. e.g. 500m, 4g, 6g\n')
+ parser.add_argument('--services', '-s', type=str, required=False,
+ help='List of services to be started, subset of \n'
+ '{broker, router, middleManager, historical, coordinator-overlord, indexer}. \n'
+ 'If the argument is not given, broker, router, middleManager, historical, coordinator-overlord \n'
+ 'and zookeeper are started. e.g. -s=broker,historical')
+ parser.add_argument('--config', '-c', type=str, required=False,
+ help='Relative path to the directory containing common and service \n'
+ 'specific properties to be overridden. \n'
+ 'This directory must contain \'_common\' directory with \n'
+ '\'common.jvm.config\' & \'common.runtime.properties\' files. \n'
+ 'If this argument is not given, config from \n'
+ 'conf/druid/auto directory is used.\n')
+ parser.add_argument('--compute', action='store_true',
+ help='Does not start Druid, only displays the memory allocated \n'
+ 'to each service if started with the given total memory.\n')
+ parser.add_argument('--zk', '-zk', action='store_true',
+ help='Specification to run zookeeper, \n'
+ 'zk config is picked up from conf/zk.')
+ parser.add_argument('--verbose', action='store_true', help='Log details')
+
+ parser.set_defaults(zk=False)
+ parser.set_defaults(compute=False)
+ parser.set_defaults(verbose=False)
+
+ return parser
+
+
+def is_file(path):
+ return os.path.isfile(path)
+
+
+def is_dir(path):
+ return os.path.isdir(path)
+
+
+def resolve_path(path):
+ return os.path.abspath(path)
+
+
+def validate_common_jvm_args(config):
+ if is_file('{0}/_common/common.jvm.config'.format(config)) is False:
+ raise ValueError('_common/common.jvm.config file is missing in the root config, '
+ 'check {0}/_common directory'.format(BASE_CONFIG_PATH))
+
+
+def validate_common_directory(config):
+ if is_dir('{0}/_common'.format(config)) is False:
+ raise ValueError(
+ '_common directory is missing in the root config, check {0}/_common directory'.format(BASE_CONFIG_PATH))
+
+ if is_file('{0}/_common/common.runtime.properties'.format(config)) is False:
+ raise ValueError('_common/common.runtime.properties file is missing in the root config, '
+ 'check {0}/_common directory'.format(BASE_CONFIG_PATH))
+
+
+def parse_arguments(args):
+ service_list = []
+ config = ""
+ total_memory = ""
+ compute = False
+ zk = False
+
+ if args.compute:
+ compute = True
+ if args.zk:
+ zk = True
+ if args.config is not None:
+ config = resolve_path(os.path.join(os.getcwd(), args.config))
+ if is_dir(config) is False:
+ raise ValueError('config {0} not found'.format(config))
+ if args.memory is not None:
+ total_memory = args.memory
+ if args.services is not None:
+ services = args.services.split(SERVICE_SEPARATOR)
+
+ for service in services:
+ if service not in SUPPORTED_SERVICES:
+ raise ValueError('Invalid service name {0}, should be one of {1}'.format(service, DEFAULT_SERVICES))
+
+ if service in service_list:
+ raise ValueError('{0} is specified multiple times'.format(service))
+
+ service_list.append(service)
+
+ if INDEXER in services and MIDDLE_MANAGER in services:
+ raise ValueError('only one of indexer and middleManager may run')
+
+ if len(service_list) == 0:
+ # start all services
+ service_list = DEFAULT_SERVICES
+ zk = True
+
+ return config, total_memory, service_list, zk, compute
+
+
+def print_startup_config(service_list, config, zk):
+ print_if_verbose('Starting {0}'.format(service_list))
+ print_if_verbose('Reading config from {0}'.format(config))
+ if zk:
+ zk_config = resolve_path('{0}/../conf/zk'.format(os.getcwd()))
+ print_if_verbose('Starting zk, reading default config from {0}'.format(zk_config))
+ print_if_verbose('\n')
+
+
+def task_memory_params_present(config, service):
+ java_opts_property_present = False
+ worker_capacity_property_present = False
+
+ if is_file('{0}/{1}/runtime.properties'.format(config, service)):
+ with open('{0}/{1}/runtime.properties'.format(config, service)) as file:
+ for line in file:
+ if line.startswith(TASK_JAVA_OPTS_PROPERTY):
+ java_opts_property_present = True
+ elif line.startswith(TASK_WORKER_CAPACITY_PROPERTY):
+ worker_capacity_property_present = True
+
+ return java_opts_property_present, worker_capacity_property_present
+
+
+def verify_service_config(service, config):
+ path = '{0}/{1}/jvm.config'.format(config, service)
+
+ required_parameters = [XMX_PARAMETER, XMS_PARAMETER]
+
+ if HEAP_TO_TOTAL_MEM_RATIO.get(service) != 1:
+ required_parameters.append(DIRECT_MEM_PARAMETER)
+
+ with open(path) as file:
+ for line in file:
+ if line.startswith(XMX_PARAMETER) and XMX_PARAMETER in required_parameters:
+ required_parameters.remove(XMX_PARAMETER)
+ if line.startswith(XMS_PARAMETER) and XMS_PARAMETER in required_parameters:
+ required_parameters.remove(XMS_PARAMETER)
+ if line.startswith(DIRECT_MEM_PARAMETER) and DIRECT_MEM_PARAMETER in required_parameters:
+ required_parameters.remove(DIRECT_MEM_PARAMETER)
+
+ if len(required_parameters) > 0:
+ params = ",".join(required_parameters)
+ raise ValueError('{0} missing in {1}/jvm.config'.format(params, service))
+
+ if service == MIDDLE_MANAGER:
+ if is_file('{0}/{1}/runtime.properties'.format(config, service)) is False:
+ raise ValueError('{0}/runtime.properties file is missing in the root config'.format(service))
+
+ mm_task_java_opts_prop, mm_task_worker_capacity_prop = task_memory_params_present(config, MIDDLE_MANAGER)
+
+ if mm_task_java_opts_prop is False:
+ raise ValueError('{0} property missing in {1}/runtime.properties'.format(TASK_JAVA_OPTS_PROPERTY, service))
+
+
+def should_compute_memory(config, total_memory, service_list):
+ """
+ if the memory argument is given, memory for services and tasks is computed; in that case, no jvm.config file
+ or runtime.properties with a task memory specification should be present.
+ Alternatively, all memory related parameters are specified explicitly,
+ which implies the following should be present:
+ jvm.config file for all services with -Xmx and -Xms parameters,
+ -XX:MaxDirectMemorySize in jvm.config for broker and historical,
+ druid.indexer.runner.javaOptsArray (optionally druid.worker.capacity) in
+ rootDirectory/middleManager/runtime.properties
+ """
+
+ jvm_config_count = 0
+ for service in service_list:
+ if is_file('{0}/{1}/jvm.config'.format(config, service)):
+ jvm_config_count += 1
+
+ mm_task_property_present = False
+ if MIDDLE_MANAGER in service_list:
+ mm_task_java_opts_prop, mm_task_worker_capacity_prop = task_memory_params_present(config, MIDDLE_MANAGER)
+ mm_task_property_present = mm_task_java_opts_prop or mm_task_worker_capacity_prop
+
+ indexer_task_worker_capacity_prop = False
+ if INDEXER in service_list:
+ indexer_task_java_opts_prop, indexer_task_worker_capacity_prop = task_memory_params_present(config, INDEXER)
+
+ # possible error states
+ # 1. memory argument is specified, but jvm.config or middleManager/runtime.properties with
+ # druid.indexer.runner.javaOptsArray or druid.worker.capacity parameters is present
+ # 2. jvm.config is not present for any service, but middleManager/runtime.properties has
+ # druid.indexer.runner.javaOptsArray or druid.worker.capacity parameters
+ # or indexer/runtime.properties has druid.worker.capacity
+ # 3. jvm.config present for some but not all services
+ # 4. jvm.config file is present for all services, but it doesn't contain required parameters
+ # 5. lastly, if middleManager is to be started, and it is missing task memory properties
+ if jvm_config_count > 0 or mm_task_property_present or indexer_task_worker_capacity_prop:
+ if total_memory != "":
+ raise ValueError(
+ "If jvm.config for services and/or middleManager/indexer configs "
+ "(druid.worker.capacity, druid.indexer.runner.javaOptsArray) is present, "
+ "memory argument shouldn't be specified")
+ if jvm_config_count == 0 and mm_task_property_present:
+ raise ValueError("middleManger configs (druid.indexer.runner.javaOptsArray or druid.worker.capacity) "
+ "is present in middleManager/runtime.properties, "
+ "add jvm.config for all other services")
+ if jvm_config_count == 0 and indexer_task_worker_capacity_prop:
+ raise ValueError("indexer configs (druid.worker.capacity) "
+ "is present in indexer/runtime.properties, "
+ "add jvm.config for all other services")
+ if jvm_config_count != len(service_list):
+ raise ValueError("jvm.config file should be present for all services or none")
+ for service in service_list:
+ verify_service_config(service, config)
+
+ return False
+
+ # compute memory only when none of the specified services contains jvm.config,
+ # if middleManager is to be started it shouldn't contain task memory properties
+ # if indexer is present it shouldn't contain task memory properties
+ return True
+
+
+def get_physical_memory_linux():
+ mem_bytes = os.sysconf('SC_PAGE_SIZE') * os.sysconf('SC_PHYS_PAGES')
+ mem_mbs = int(mem_bytes / (1024 * 1024))
+ return mem_mbs
+
+
+def get_physical_memory_osx():
+ p1 = subprocess.Popen(['sysctl', '-a'], stdout=subprocess.PIPE)
+ p2 = subprocess.check_output(['grep', 'hw.memsize'], stdin=p1.stdout)
+ p2 = p2.decode('utf-8')
+ fields = p2.split(':')
+
+ mem_mbs = int(int(fields[1]) / (1024 * 1024))
+
+ return mem_mbs
+
+
+def get_physical_memory():
+ operating_system = platform.system()
+ print_if_verbose('operating system is {0}'.format(operating_system))
+
+ system_memory = None
+
+ try:
+ if operating_system == 'Darwin':
+ system_memory = get_physical_memory_osx()
+ elif operating_system == 'Linux':
+ system_memory = get_physical_memory_linux()
+ except Exception:
+ pass
+
+ return system_memory
+
+
+def convert_total_memory_string(memory):
+ try:
+ if memory == '':
+ physical_memory = get_physical_memory()
+
+ if physical_memory is None:
+ raise ValueError('Please specify memory argument')
+
+ return physical_memory
+ elif memory.endswith(MEM_MB_SUFFIX):
+ return int(memory[:-1])
+ elif memory.endswith(MEM_GB_SUFFIX):
+ return 1024 * int(memory[:-1])
+ else:
+ raise ValueError('Incorrect format for memory argument, expected format is <number>m or <number>g, e.g. 500m, 4g')
+ except ValueError as e:
+ raise e
+ except Exception:
+ raise ValueError('Incorrect format for memory argument, expected format is <number>m or <number>g, e.g. 500m, 4g')
+
+
+def check_memory_constraint(total_memory, services):
+ # 80% of total memory should be >= the sum of the per-service lower-bound memory
+ lower_bound_memory = 0
+
+ service_list = list(services)
+ if MIDDLE_MANAGER in services:
+ service_list.append(TASKS)
+
+ for service in service_list:
+ lower_bound_memory += MINIMUM_MEMORY_MB.get(service)
+
+ required_memory = int(lower_bound_memory / 0.8)
+
+ if total_memory < required_memory:
+ raise ValueError('Minimum memory required for starting services is {0}m'.format(required_memory))
+
+ if total_memory >= 2 * lower_bound_memory:
+ return int(total_memory / 2)
+ else:
+ return lower_bound_memory
+
+
+def build_mm_task_java_opts_array(memory_type):
+ task_memory = '-D{0}=['.format(TASK_JAVA_OPTS_PROPERTY)
+
+ mem_array = TASK_MEM_MAP.get(memory_type)
+
+ java_opts_list = TASK_JAVA_OPTS_ARRAY + mem_array
+
+ for item in java_opts_list:
+ task_memory += '\"{0}\",'.format(item)
+
+ task_memory = task_memory[:-1]
+ task_memory += ']'
+ return task_memory
+
+
+def compute_tasks_memory(allocated_memory):
+ if allocated_memory >= 4096:
+ task_count = int(allocated_memory / 2048)
+ memory_type = TASK_MEM_TYPE_HIGH
+ task_memory_mb = 2048
+ else:
+ task_count = 2
+ memory_type = TASK_MEM_TYPE_LOW
+ task_memory_mb = 512
+ task_count = min(task_count, multiprocessing.cpu_count())
+
+ return memory_type, task_count, task_memory_mb
+
+
+def build_memory_config(service, allocated_memory):
+ if service == TASKS:
+ memory_type, task_count, task_memory = compute_tasks_memory(allocated_memory)
+ java_opts_array = build_mm_task_java_opts_array(memory_type)
+ return ['-D{0}={1}'.format(TASK_WORKER_CAPACITY_PROPERTY, task_count),
+ java_opts_array], task_memory * task_count
+ elif service == INDEXER:
+ heap_memory = HEAP_TO_TOTAL_MEM_RATIO.get(service) * allocated_memory
+ direct_memory = int(allocated_memory - heap_memory)
+ heap_memory = int(heap_memory)
+ memory_type, task_count, task_memory = compute_tasks_memory(allocated_memory)
+ return ['-D{0}={1}'.format(TASK_WORKER_CAPACITY_PROPERTY, task_count),
+ '-Xms{0}m -Xmx{0}m -XX:MaxDirectMemorySize={1}m'.format(heap_memory, direct_memory)], \
+ task_memory * task_count
+ else:
+ heap_memory = HEAP_TO_TOTAL_MEM_RATIO.get(service) * allocated_memory
+ direct_memory = int(allocated_memory - heap_memory)
+ heap_memory = int(heap_memory)
+
+ if direct_memory == 0:
+ return '-Xms{0}m -Xmx{0}m'.format(heap_memory), allocated_memory
+
+ return '-Xms{0}m -Xmx{0}m -XX:MaxDirectMemorySize={1}m'.format(heap_memory, direct_memory), allocated_memory
+
+
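+# Splits the memory budget across services in proportion to SERVICE_MEMORY_RATIO,
+# first pinning any service that would fall below its MINIMUM_MEMORY_MB floor and
+# then redistributing the remainder among the other services.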
+def distribute_memory(services, total_memory):
+ service_memory_config = {}
+
+ memory_weight_sum = 0
+
+ service_list = list(services)
+ if MIDDLE_MANAGER in services:
+ service_list.append(TASKS)
+
+ for service in service_list:
+ memory_weight_sum += SERVICE_MEMORY_RATIO.get(service)
+
+ multiplier = total_memory / memory_weight_sum
+
+ lower_bound_memory_allocation = 0
+ allocated_services = set()
+
+ for service in service_list:
+ allocated_memory = SERVICE_MEMORY_RATIO.get(service) * multiplier
+ if service in MINIMUM_MEMORY_MB and allocated_memory < MINIMUM_MEMORY_MB.get(service):
+ allocated_memory = MINIMUM_MEMORY_MB.get(service)
+ service_memory_config[service], allocated_memory = build_memory_config(service, allocated_memory)
+ lower_bound_memory_allocation += allocated_memory
+ allocated_services.add(service)
+
+ if lower_bound_memory_allocation > 0:
+ # compute the multiplier again for remaining services
+ memory_weight_sum = 0
+ for service in service_list:
+ if service in allocated_services:
+ continue
+ memory_weight_sum += SERVICE_MEMORY_RATIO.get(service)
+ multiplier = (total_memory - lower_bound_memory_allocation) / memory_weight_sum
+
+ for service in service_list:
+ if service in allocated_services:
+ continue
+ allocated_memory = SERVICE_MEMORY_RATIO.get(service) * multiplier
+ if service in MINIMUM_MEMORY_MB and allocated_memory < MINIMUM_MEMORY_MB.get(service):
+ allocated_memory = MINIMUM_MEMORY_MB.get(service)
+
+ service_memory_config[service], allocated_memory = build_memory_config(service, allocated_memory)
+
+ print_if_verbose('\nMemory distribution for services:')
+ for key, value in service_memory_config.items():
+ print_if_verbose('{0}, {1}'.format(key, value))
+ print_if_verbose('\n')
+
+ return service_memory_config
+
+
+def append_command(commands, command):
+ commands.append('--command')
+ commands.append(command)
+
+
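+# Builds the argument list for the supervise script, passing each service's run
+# command through repeated --command flags instead of a config file.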
+def build_supervise_script_arguments(service_list, service_memory_config, config, zk):
+ commands = []
+ commands.append('supervise')
+
+ append_command(commands, ":verify bin/verify-java")
+ append_command(commands, ":verify bin/verify-default-ports")
+ append_command(commands, ":notify bin/greet")
+ append_command(commands, ":kill-timeout 10")
+
+ if zk:
+ append_command(commands, "!p10 zk bin/run-zk conf")
+
+ for service in service_list:
+ memory_config = service_memory_config.get(service)
+
+ prefix = ''
+ if service == MIDDLE_MANAGER:
+ prefix = '!p90 '
+
+ if memory_config is None:
+ append_command(commands, '{0}{1} bin/run-druid {1} {2}'.format(prefix, service, config))
+ else:
+ if service == MIDDLE_MANAGER:
+ task_config = service_memory_config.get(TASKS)
+ task_count = task_config[0]
+ task_memory = task_config[1]
+ append_command(
+ commands,
+ '{0}{1} bin/run-druid {1} {2} \'{3}\' \'{4} {5}\''
+ .format(prefix, service, config, memory_config, task_count, task_memory))
+ elif service == INDEXER:
+ task_count = memory_config[0]
+ jvm_args = memory_config[1]
+ append_command(
+ commands,
+ '{0}{1} bin/run-druid {1} {2} \'{3}\' \'{4}\''
+ .format(prefix, service, config, jvm_args, task_count))
+ else:
+ append_command(commands,
+ '{0}{1} bin/run-druid {1} {2} \'{3}\''.format(prefix, service, config, memory_config))
+
+ print_if_verbose('Supervise script args:')
+ for item in commands:
+ print_if_verbose(item)
+
+ print_if_verbose('\n')
+
+ return commands
+
+
+def main():
+ parser = configure_parser()
+ args = parser.parse_args()
+
+ global LOGGING_ENABLED
+ LOGGING_ENABLED = args.verbose or args.compute
+
+ config, total_memory, service_list, zk, compute = parse_arguments(args)
+
+ # change directory to bin
+ os.chdir(os.path.dirname(sys.argv[0]))
+
+ if config == "":
+ config = resolve_path('{0}/../{1}'.format(os.getcwd(), BASE_CONFIG_PATH))
+
+ validate_common_directory(config)
+
+ print_startup_config(service_list, config, zk)
+
+ service_memory_config = {}
+
+ if should_compute_memory(config, total_memory, service_list):
+ # if memory is to be computed, _common directory should contain common.jvm.config
+ validate_common_jvm_args(config)
+ memory_in_mega_bytes = convert_total_memory_string(total_memory)
+ print_if_verbose('Total memory is {0}m\n'.format(memory_in_mega_bytes))
+ memory_to_be_used = check_memory_constraint(memory_in_mega_bytes, service_list)
+ print_if_verbose('Memory used for services & tasks {0}m\n'.format(memory_to_be_used))
+ service_memory_config = distribute_memory(service_list, memory_to_be_used)
+ else:
+ print_if_verbose('Not computing memory distribution, reading memory specification from service jvm.config & '
+ 'middleManager/runtime.properties\n')
+
+ script_arguments = build_supervise_script_arguments(service_list, service_memory_config, config, zk)
+
+ if compute:
+ return
+
+ os.execv('./supervise', script_arguments)
+
+
+try:
+ main()
+except (KeyboardInterrupt, ValueError) as error:
+ print(error)
+ sys.exit(1)
diff --git a/examples/bin/supervise b/examples/bin/supervise
index 81b7e57b049e..ba336c31aa66 100755
--- a/examples/bin/supervise
+++ b/examples/bin/supervise
@@ -46,6 +46,51 @@ sub usage
die "usage: $0 -c [-d ] [-t ] [--svlogd ]\n";
}
+sub process_config
+{
+ my @lines = @_;
+ my @commands;
+ my @verify;
+ my @notify;
+ my $kill_timeout;
+ for my $line (@lines)
+ {
+ if ($line =~ /^(:verify|:notify|:kill-timeout|(?:\!p[0-9]+\s+)?[^:]\S+)\s+(.+)$/) {
+ my $name = $1;
+ my $order = 50;
+ my $command = $2;
+
+ if ($name =~ /^(?:\!p([0-9]+)\s+)(.*)$/) {
+ $order = $1;
+ $name = $2;
+ }
+
+ if ($name eq ':verify') {
+ push @verify, $command;
+ } elsif ($name eq ':notify') {
+ push @notify, $command;
+ } elsif ($name eq ':kill-timeout') {
+ $kill_timeout = int($command);
+ } else {
+ die "Duplicate command: $line\n" if grep { $_->{name} eq $name } @commands;
+ push @commands, {
+ name => $name,
+ command => $command,
+ order => $order, # Stop order for this command
+ pid => 0, # Current pid, or 0 if not running
+ down => 0, # Time the proc should be down until
+ killed => 0, # Signal we sent to this process
+ restarting => 0, # True if this command is currently restarting
+ };
+ }
+ } else {
+ die "Syntax error: $line\n";
+ }
+ }
+
+ return { commands => \@commands, verify => \@verify, notify => \@notify, 'kill-timeout' => $kill_timeout };
+}
+
sub read_config_file
{
my ($config_file) = @_;
@@ -53,49 +98,20 @@ sub read_config_file
open my $config_fh, "<", $config_file
or die "open $config_file: $!";
- my @commands;
- my @verify;
- my @notify;
- my $kill_timeout;
+ my @lines;
while (my $line = <$config_fh>) {
chomp $line;
next if $line =~ /^(\s*\#.*|\s*)$/;
if ($line =~ /^(:verify|:notify|:kill-timeout|(?:\!p[0-9]+\s+)?[^:]\S+)\s+(.+)$/) {
- my $name = $1;
- my $order = 50;
- my $command = $2;
-
- if ($name =~ /^(?:\!p([0-9]+)\s+)(.*)$/) {
- $order = $1;
- $name = $2;
- }
-
- if ($name eq ':verify') {
- push @verify, $command;
- } elsif ($name eq ':notify') {
- push @notify, $command;
- } elsif ($name eq ':kill-timeout') {
- $kill_timeout = int($command);
- } else {
- die "Duplicate command: $line\n" if grep { $_->{name} eq $name } @commands;
- push @commands, {
- name => $name,
- command => $command,
- order => $order, # Stop order for this command
- pid => 0, # Current pid, or 0 if not running
- down => 0, # Time the proc should be down until
- killed => 0, # Signal we sent to this process
- restarting => 0, # True if this command is currently restarting
- };
- }
+ push @lines, $line
} else {
die "Syntax error: $line\n";
}
}
close $config_fh;
- return { commands => \@commands, verify => \@verify, notify => \@notify, 'kill-timeout' => $kill_timeout };
+ return @lines;
}
sub stringify_exit_status
@@ -179,13 +195,23 @@ usage() unless GetOptions(
'vardir|d=s',
'kill-timeout|t=i',
'chdir=s',
- 'svlogd:s'
+ 'svlogd:s',
+ 'command=s@'
);
-usage() unless $opt{'conf'} && $opt{'vardir'};
+usage() unless (($opt{'command'} && @{$opt{'command'}}) || $opt{'conf'}) && $opt{'vardir'};
+
+my @config_lines;
+
+# get commands to execute either from reading the config file or command line
+if (not defined $opt{'conf'}) {
+ @config_lines = @{$opt{'command'}}
+} else {
+ @config_lines = read_config_file($opt{'conf'});
+}
+
+my $config = process_config(@config_lines);
-# Read config file
-my $config = read_config_file($opt{'conf'});
@commands = @{$config->{commands}};
if (!@commands) {
diff --git a/examples/conf/druid/auto/_common/common.jvm.config b/examples/conf/druid/auto/_common/common.jvm.config
new file mode 100644
index 000000000000..fd74cf358979
--- /dev/null
+++ b/examples/conf/druid/auto/_common/common.jvm.config
@@ -0,0 +1,7 @@
+-server
+-XX:+ExitOnOutOfMemoryError
+-XX:+UseG1GC
+-Duser.timezone=UTC
+-Dfile.encoding=UTF-8
+-Djava.io.tmpdir=var/tmp
+-Djava.util.logging.manager=org.apache.logging.log4j.jul.LogManager
diff --git a/examples/conf/druid/auto/_common/common.runtime.properties b/examples/conf/druid/auto/_common/common.runtime.properties
new file mode 100644
index 000000000000..b0adb0695cd7
--- /dev/null
+++ b/examples/conf/druid/auto/_common/common.runtime.properties
@@ -0,0 +1,158 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+# Extensions specified in the load list will be loaded by Druid
+# We are using local fs for deep storage - not recommended for production - use S3, HDFS, or NFS instead
+# We are using local derby for the metadata store - not recommended for production - use MySQL or Postgres instead
+
+# If you specify `druid.extensions.loadList=[]`, Druid won't load any extension from file system.
+# If you don't specify `druid.extensions.loadList`, Druid will load all the extensions under root extension directory.
+# More info: https://druid.apache.org/docs/latest/operations/including-extensions.html
+druid.extensions.loadList=["druid-hdfs-storage", "druid-kafka-indexing-service", "druid-datasketches", "druid-multi-stage-query"]
+
+# If you have a different version of Hadoop, place your Hadoop client jar files in your hadoop-dependencies directory
+# and uncomment the line below to point to your directory.
+#druid.extensions.hadoopDependenciesDir=/my/dir/hadoop-dependencies
+
+
+#
+# Hostname
+#
+druid.host=localhost
+
+#
+# Logging
+#
+
+# Log all runtime properties on startup. Disable this to keep properties out of the startup logs:
+druid.startup.logging.logProperties=true
+
+#
+# Zookeeper
+#
+
+druid.zk.service.host=localhost
+druid.zk.paths.base=/druid
+
+#
+# Metadata storage
+#
+
+# For Derby server on your Druid Coordinator (only viable in a cluster with a single Coordinator, no fail-over):
+druid.metadata.storage.type=derby
+druid.metadata.storage.connector.connectURI=jdbc:derby://localhost:1527/var/druid/metadata.db;create=true
+druid.metadata.storage.connector.host=localhost
+druid.metadata.storage.connector.port=1527
+
+# For MySQL (make sure to include the MySQL JDBC driver on the classpath):
+#druid.metadata.storage.type=mysql
+#druid.metadata.storage.connector.connectURI=jdbc:mysql://db.example.com:3306/druid
+#druid.metadata.storage.connector.user=...
+#druid.metadata.storage.connector.password=...
+
+# For PostgreSQL:
+#druid.metadata.storage.type=postgresql
+#druid.metadata.storage.connector.connectURI=jdbc:postgresql://db.example.com:5432/druid
+#druid.metadata.storage.connector.user=...
+#druid.metadata.storage.connector.password=...
+
+#
+# Deep storage
+#
+
+# For local disk (only viable in a cluster if this is a network mount):
+druid.storage.type=local
+druid.storage.storageDirectory=var/druid/segments
+
+# For HDFS:
+#druid.storage.type=hdfs
+#druid.storage.storageDirectory=/druid/segments
+
+# For S3:
+#druid.storage.type=s3
+#druid.storage.bucket=your-bucket
+#druid.storage.baseKey=druid/segments
+#druid.s3.accessKey=...
+#druid.s3.secretKey=...
+
+#
+# Indexing service logs
+#
+
+# For local disk (only viable in a cluster if this is a network mount):
+druid.indexer.logs.type=file
+druid.indexer.logs.directory=var/druid/indexing-logs
+
+# For HDFS:
+#druid.indexer.logs.type=hdfs
+#druid.indexer.logs.directory=/druid/indexing-logs
+
+# For S3:
+#druid.indexer.logs.type=s3
+#druid.indexer.logs.s3Bucket=your-bucket
+#druid.indexer.logs.s3Prefix=druid/indexing-logs
+
+#
+# Service discovery
+#
+
+druid.selectors.indexing.serviceName=druid/overlord
+druid.selectors.coordinator.serviceName=druid/coordinator
+
+#
+# Monitoring
+#
+
+druid.monitoring.monitors=["org.apache.druid.java.util.metrics.JvmMonitor"]
+druid.emitter=noop
+druid.emitter.logging.logLevel=info
+
+# Storage type of double columns
+# Omitting this will cause doubles to be indexed as floats at the storage layer.
+
+druid.indexing.doubleStorage=double
+
+#
+# Security
+#
+druid.server.hiddenProperties=["druid.s3.accessKey","druid.s3.secretKey","druid.metadata.storage.connector.password", "password", "key", "token", "pwd"]
+
+
+#
+# SQL
+#
+druid.sql.enable=true
+
+# Planning SQL query when there is aggregate distinct in the statement
+druid.sql.planner.useGroupingSetForExactDistinct=true
+
+#
+# Lookups
+#
+druid.lookup.enableLookupSyncOnStartup=false
+
+#
+# Expression processing config
+#
+druid.expressions.useStrictBooleans=true
+
+#
+# Http client
+#
+druid.global.http.eagerInitialization=false
diff --git a/examples/conf/druid/auto/_common/log4j2.xml b/examples/conf/druid/auto/_common/log4j2.xml
new file mode 100644
index 000000000000..66dc13da4c5e
--- /dev/null
+++ b/examples/conf/druid/auto/_common/log4j2.xml
@@ -0,0 +1,86 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!-- [log4j2 configuration for the example cluster: ASF license header,
+     appenders, and logger levels; 86 lines of XML elided] -->
diff --git a/examples/conf/druid/auto/broker/runtime.properties b/examples/conf/druid/auto/broker/runtime.properties
new file mode 100644
index 000000000000..f4c494019933
--- /dev/null
+++ b/examples/conf/druid/auto/broker/runtime.properties
@@ -0,0 +1,41 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+druid.service=druid/broker
+druid.plaintextPort=8082
+
+# HTTP server settings
+# HTTP server thread pool size. Higher values increase peak load on the Broker, but
+# may be useful for high-concurrency workloads.
+# Default is max(10, (Number of processors * 17) / 16 + 2) + 30.
+# druid.server.http.numThreads=N
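+# For example (illustrative arithmetic), a machine with 16 processors would
+# default to max(10, (16 * 17) / 16 + 2) + 30 = max(10, 19) + 30 = 49 threads.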
+
+# HTTP client settings
+# Connection pool size from the Broker to each data server. May be useful to
+# raise this for high-concurrency workloads.
+# druid.broker.http.numConnections=20
+
+# Processing threads and buffers
+# Determined automatically based on available memory. For details on how to manually set parameters:
+# https://druid.apache.org/docs/latest/operations/basic-cluster-tuning.html#guidelines-for-processing-threads-and-buffers
+druid.processing.tmpDir=var/druid/processing
+
+# Query cache disabled -- push down caching and merging instead
+druid.broker.cache.useCache=false
+druid.broker.cache.populateCache=false
diff --git a/examples/conf/druid/auto/coordinator-overlord/runtime.properties b/examples/conf/druid/auto/coordinator-overlord/runtime.properties
new file mode 100644
index 000000000000..c053823f8ed8
--- /dev/null
+++ b/examples/conf/druid/auto/coordinator-overlord/runtime.properties
@@ -0,0 +1,33 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+druid.service=druid/coordinator
+druid.plaintextPort=8081
+
+druid.coordinator.startDelay=PT10S
+druid.coordinator.period=PT5S
+druid.manager.segments.pollDuration=PT5S
+
+# Run the overlord service in the coordinator process
+druid.coordinator.asOverlord.enabled=true
+druid.coordinator.asOverlord.overlordService=druid/overlord
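+# With asOverlord enabled, Overlord APIs are served by this Coordinator process
+# on the port above (8081), so no separate Overlord service needs to run.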
+
+druid.indexer.queue.startDelay=PT5S
+
+druid.indexer.storage.type=metadata
diff --git a/examples/conf/druid/auto/historical/runtime.properties b/examples/conf/druid/auto/historical/runtime.properties
new file mode 100644
index 000000000000..6c241aa7cf06
--- /dev/null
+++ b/examples/conf/druid/auto/historical/runtime.properties
@@ -0,0 +1,35 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+# HTTP server thread pool size. Higher values increase peak load on the Historical, but
+# may be useful for high-concurrency workloads.
+# Default is max(10, (Number of processors * 17) / 16 + 2) + 30.
+# druid.server.http.numThreads=N
+
+# Processing threads and buffers
+# Determined automatically based on available memory. For details on how to manually set parameters:
+# https://druid.apache.org/docs/latest/operations/basic-cluster-tuning.html#guidelines-for-processing-threads-and-buffers
+druid.processing.tmpDir=var/druid/processing
+
+# Segment storage
+druid.segmentCache.locations=[{"path":"var/druid/segment-cache","maxSize":"300g"}]
+# Query cache
+druid.historical.cache.useCache=true
+druid.historical.cache.populateCache=true
+druid.cache.type=caffeine
diff --git a/examples/conf/druid/auto/indexer/runtime.properties b/examples/conf/druid/auto/indexer/runtime.properties
new file mode 100644
index 000000000000..5aef64535b67
--- /dev/null
+++ b/examples/conf/druid/auto/indexer/runtime.properties
@@ -0,0 +1,34 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+druid.service=druid/indexer
+druid.plaintextPort=8091
+
+# Number of tasks (druid.worker.capacity) is automatically
+# determined based on the number of available processors.
+
+# Task launch parameters
+druid.indexer.task.baseTaskDir=var/druid/task
+
+# Processing threads and buffers on Indexer
+# Determined automatically based on available memory. For details on how to manually set parameters:
+# https://druid.apache.org/docs/latest/operations/basic-cluster-tuning.html#guidelines-for-processing-threads-and-buffers
+
+# Hadoop indexing
+druid.indexer.task.hadoopWorkingPath=var/druid/hadoop-tmp
diff --git a/examples/conf/druid/auto/middleManager/runtime.properties b/examples/conf/druid/auto/middleManager/runtime.properties
new file mode 100644
index 000000000000..08c58bae6de0
--- /dev/null
+++ b/examples/conf/druid/auto/middleManager/runtime.properties
@@ -0,0 +1,36 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+druid.service=druid/middleManager
+druid.plaintextPort=8091
+
+# Number of tasks (druid.worker.capacity) and memory usage per task (druid.indexer.runner.javaOptsArray) is automatically
+# determined based on available memory. For details on how to manually set parameters, see:
+# https://druid.apache.org/docs/latest/operations/basic-cluster-tuning.html#middlemanager
+
+# Task launch parameters
+druid.indexer.runner.javaCommand=bin/run-java
+druid.indexer.task.baseTaskDir=var/druid/task
+
+# Processing threads and buffers on Peons
+# Determined automatically based on available memory. For details on how to manually set parameters:
+# https://druid.apache.org/docs/latest/operations/basic-cluster-tuning.html#guidelines-for-processing-threads-and-buffers
+
+# Hadoop indexing
+druid.indexer.task.hadoopWorkingPath=var/druid/hadoop-tmp
diff --git a/examples/conf/druid/auto/router/runtime.properties b/examples/conf/druid/auto/router/runtime.properties
new file mode 100644
index 000000000000..3858dec044bd
--- /dev/null
+++ b/examples/conf/druid/auto/router/runtime.properties
@@ -0,0 +1,28 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+druid.service=druid/router
+druid.plaintextPort=8888
+
+# Service discovery
+druid.router.defaultBrokerServiceName=druid/broker
+druid.router.coordinatorServiceName=druid/coordinator
+
+# Management proxy to coordinator / overlord: required for unified web console.
+druid.router.managementProxy.enabled=true
diff --git a/extendedset/pom.xml b/extendedset/pom.xml
index bdd52ead1656..1927d59cff52 100755
--- a/extendedset/pom.xml
+++ b/extendedset/pom.xml
@@ -31,7 +31,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
diff --git a/extensions-contrib/aliyun-oss-extensions/pom.xml b/extensions-contrib/aliyun-oss-extensions/pom.xml
index 4fdde743a947..9336122ed5ff 100644
--- a/extensions-contrib/aliyun-oss-extensions/pom.xml
+++ b/extensions-contrib/aliyun-oss-extensions/pom.xml
@@ -28,7 +28,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/ambari-metrics-emitter/pom.xml b/extensions-contrib/ambari-metrics-emitter/pom.xml
index a267edc55485..fc7f73be4a6c 100644
--- a/extensions-contrib/ambari-metrics-emitter/pom.xml
+++ b/extensions-contrib/ambari-metrics-emitter/pom.xml
@@ -24,7 +24,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/cassandra-storage/pom.xml b/extensions-contrib/cassandra-storage/pom.xml
index d9ed4ccff56b..2dd7d409143e 100644
--- a/extensions-contrib/cassandra-storage/pom.xml
+++ b/extensions-contrib/cassandra-storage/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/cloudfiles-extensions/pom.xml b/extensions-contrib/cloudfiles-extensions/pom.xml
index 3bd9c3220371..e3c13d1962cc 100644
--- a/extensions-contrib/cloudfiles-extensions/pom.xml
+++ b/extensions-contrib/cloudfiles-extensions/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/compressed-bigdecimal/pom.xml b/extensions-contrib/compressed-bigdecimal/pom.xml
index a9929c3c949c..f4309fa2d26a 100644
--- a/extensions-contrib/compressed-bigdecimal/pom.xml
+++ b/extensions-contrib/compressed-bigdecimal/pom.xml
@@ -25,7 +25,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMaxSqlAggregatorTest.java b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMaxSqlAggregatorTest.java
index fec14699d40c..06709040b645 100644
--- a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMaxSqlAggregatorTest.java
+++ b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMaxSqlAggregatorTest.java
@@ -19,23 +19,13 @@
package org.apache.druid.compressedbigdecimal;
-import com.google.common.collect.ImmutableSet;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
-
public class CompressedBigDecimalMaxSqlAggregatorTest extends CompressedBigDecimalSqlAggregatorTestBase
{
private static final String FUNCTION_NAME = CompressedBigDecimalMaxSqlAggregator.NAME;
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return new DruidOperatorTable(ImmutableSet.of(new CompressedBigDecimalMaxSqlAggregator()), ImmutableSet.of());
- }
-
@Override
public void testCompressedBigDecimalAggWithNumberParse()
{
-
testCompressedBigDecimalAggWithNumberParseHelper(
FUNCTION_NAME,
new Object[]{"6.000000000", "6.000000000", "10.100000000"},
diff --git a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMinSqlAggregatorTest.java b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMinSqlAggregatorTest.java
index 0031780ee300..3a18dd49652b 100644
--- a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMinSqlAggregatorTest.java
+++ b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalMinSqlAggregatorTest.java
@@ -19,19 +19,10 @@
package org.apache.druid.compressedbigdecimal;
-import com.google.common.collect.ImmutableSet;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
-
public class CompressedBigDecimalMinSqlAggregatorTest extends CompressedBigDecimalSqlAggregatorTestBase
{
private static final String FUNCTION_NAME = CompressedBigDecimalMinSqlAggregator.NAME;
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return new DruidOperatorTable(ImmutableSet.of(new CompressedBigDecimalMinSqlAggregator()), ImmutableSet.of());
- }
-
@Override
public void testCompressedBigDecimalAggWithNumberParse()
{
diff --git a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSqlAggregatorTestBase.java b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSqlAggregatorTestBase.java
index 9f661b7d3987..5d1c67c2f38a 100644
--- a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSqlAggregatorTestBase.java
+++ b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSqlAggregatorTestBase.java
@@ -20,17 +20,17 @@
package org.apache.druid.compressedbigdecimal;
import com.fasterxml.jackson.databind.MapperFeature;
-import com.fasterxml.jackson.databind.Module;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.fasterxml.jackson.databind.SerializationFeature;
import com.google.common.collect.ImmutableList;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.data.input.InputRow;
import org.apache.druid.data.input.impl.DimensionsSpec;
import org.apache.druid.data.input.impl.InputRowParser;
import org.apache.druid.data.input.impl.MapInputRowParser;
import org.apache.druid.data.input.impl.TimeAndDimsParseSpec;
import org.apache.druid.data.input.impl.TimestampSpec;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.StringUtils;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.query.Druids;
@@ -45,7 +45,6 @@
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
@@ -74,16 +73,17 @@ public abstract class CompressedBigDecimalSqlAggregatorTestBase extends BaseCalc
TestDataBuilder.RAW_ROWS1.stream().map(m -> TestDataBuilder.createRow(m, PARSER)).collect(Collectors.toList());
@Override
- public Iterable<? extends Module> getJacksonModules()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- CompressedBigDecimalModule bigDecimalModule = new CompressedBigDecimalModule();
- return Iterables.concat(super.getJacksonModules(), bigDecimalModule.getJacksonModules());
+ super.configureGuice(builder);
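+ // Registering the module through Guice supplies both its Jackson serde and its
+ // SQL operators, so subclasses no longer build a DruidOperatorTable by hand.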
+ builder.addModule(new CompressedBigDecimalModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
QueryableIndex index =
@@ -121,9 +121,6 @@ public void configureJsonMapper(ObjectMapper objectMapper)
objectMapper.configure(MapperFeature.SORT_PROPERTIES_ALPHABETICALLY, true);
}
- @Override
- public abstract DruidOperatorTable createOperatorTable();
-
@Test
public abstract void testCompressedBigDecimalAggWithNumberParse();
@@ -279,5 +276,4 @@ public void testCompressedBigDecimalAggDefaultSizeAndScaleHelper(
ImmutableList.of(expectedResults)
);
}
-
}
diff --git a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSumSqlAggregatorTest.java b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSumSqlAggregatorTest.java
index c7bc86d15438..db248ef67f0e 100644
--- a/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSumSqlAggregatorTest.java
+++ b/extensions-contrib/compressed-bigdecimal/src/test/java/org/apache/druid/compressedbigdecimal/CompressedBigDecimalSumSqlAggregatorTest.java
@@ -19,19 +19,10 @@
package org.apache.druid.compressedbigdecimal;
-import com.google.common.collect.ImmutableSet;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
-
public class CompressedBigDecimalSumSqlAggregatorTest extends CompressedBigDecimalSqlAggregatorTestBase
{
private static final String FUNCTION_NAME = CompressedBigDecimalSumSqlAggregator.NAME;
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return new DruidOperatorTable(ImmutableSet.of(new CompressedBigDecimalSumSqlAggregator()), ImmutableSet.of());
- }
-
@Override
public void testCompressedBigDecimalAggWithNumberParse()
{
@@ -39,7 +30,6 @@ public void testCompressedBigDecimalAggWithNumberParse()
FUNCTION_NAME,
new Object[]{"21.000000000", "21.000000000", "13.100000000"},
CompressedBigDecimalSumAggregatorFactory::new
-
);
}
diff --git a/extensions-contrib/distinctcount/pom.xml b/extensions-contrib/distinctcount/pom.xml
index 7dd0b77f69be..35ffdd9510d2 100644
--- a/extensions-contrib/distinctcount/pom.xml
+++ b/extensions-contrib/distinctcount/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/dropwizard-emitter/pom.xml b/extensions-contrib/dropwizard-emitter/pom.xml
index 714ac2090d9a..0ebe49754660 100644
--- a/extensions-contrib/dropwizard-emitter/pom.xml
+++ b/extensions-contrib/dropwizard-emitter/pom.xml
@@ -24,7 +24,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/gce-extensions/pom.xml b/extensions-contrib/gce-extensions/pom.xml
index 3a3fb73b1be0..aebb755c0b1d 100644
--- a/extensions-contrib/gce-extensions/pom.xml
+++ b/extensions-contrib/gce-extensions/pom.xml
@@ -21,7 +21,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/graphite-emitter/pom.xml b/extensions-contrib/graphite-emitter/pom.xml
index e44036db513f..44759f8f4653 100644
--- a/extensions-contrib/graphite-emitter/pom.xml
+++ b/extensions-contrib/graphite-emitter/pom.xml
@@ -24,7 +24,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/influx-extensions/pom.xml b/extensions-contrib/influx-extensions/pom.xml
index 326cea69f81e..aab1f8c05cca 100644
--- a/extensions-contrib/influx-extensions/pom.xml
+++ b/extensions-contrib/influx-extensions/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/influxdb-emitter/pom.xml b/extensions-contrib/influxdb-emitter/pom.xml
index 01381b799c32..12dc1b34bba8 100644
--- a/extensions-contrib/influxdb-emitter/pom.xml
+++ b/extensions-contrib/influxdb-emitter/pom.xml
@@ -28,7 +28,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/kafka-emitter/pom.xml b/extensions-contrib/kafka-emitter/pom.xml
index 38ef7efcf5ba..b1f575d9020d 100644
--- a/extensions-contrib/kafka-emitter/pom.xml
+++ b/extensions-contrib/kafka-emitter/pom.xml
@@ -24,7 +24,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/kubernetes-overlord-extensions/pom.xml b/extensions-contrib/kubernetes-overlord-extensions/pom.xml
index ffd94574111d..9503eeeb6ced 100644
--- a/extensions-contrib/kubernetes-overlord-extensions/pom.xml
+++ b/extensions-contrib/kubernetes-overlord-extensions/pom.xml
@@ -30,7 +30,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/materialized-view-maintenance/pom.xml b/extensions-contrib/materialized-view-maintenance/pom.xml
index 449d2324aa7c..c8057bc78c57 100644
--- a/extensions-contrib/materialized-view-maintenance/pom.xml
+++ b/extensions-contrib/materialized-view-maintenance/pom.xml
@@ -22,7 +22,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/materialized-view-selection/pom.xml b/extensions-contrib/materialized-view-selection/pom.xml
index c65bccd0bc1b..d23344f1fd02 100644
--- a/extensions-contrib/materialized-view-selection/pom.xml
+++ b/extensions-contrib/materialized-view-selection/pom.xml
@@ -22,7 +22,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/momentsketch/pom.xml b/extensions-contrib/momentsketch/pom.xml
index 1d6afba02d1a..08843ed1669f 100644
--- a/extensions-contrib/momentsketch/pom.xml
+++ b/extensions-contrib/momentsketch/pom.xml
@@ -22,7 +22,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/moving-average-query/pom.xml b/extensions-contrib/moving-average-query/pom.xml
index d53c79b3f963..f686cdfc6a4e 100644
--- a/extensions-contrib/moving-average-query/pom.xml
+++ b/extensions-contrib/moving-average-query/pom.xml
@@ -24,7 +24,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/opentelemetry-emitter/pom.xml b/extensions-contrib/opentelemetry-emitter/pom.xml
index 5a1c4027e7be..8bdb7b3dd5d8 100644
--- a/extensions-contrib/opentelemetry-emitter/pom.xml
+++ b/extensions-contrib/opentelemetry-emitter/pom.xml
@@ -23,7 +23,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/opentsdb-emitter/pom.xml b/extensions-contrib/opentsdb-emitter/pom.xml
index 18fd9c61442d..2d68ecf1bca9 100644
--- a/extensions-contrib/opentsdb-emitter/pom.xml
+++ b/extensions-contrib/opentsdb-emitter/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/prometheus-emitter/pom.xml b/extensions-contrib/prometheus-emitter/pom.xml
index 63e7fba6d528..8d5b13aa7281 100644
--- a/extensions-contrib/prometheus-emitter/pom.xml
+++ b/extensions-contrib/prometheus-emitter/pom.xml
@@ -23,7 +23,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/redis-cache/pom.xml b/extensions-contrib/redis-cache/pom.xml
index f7ec74e8b28b..e6551e6b792b 100644
--- a/extensions-contrib/redis-cache/pom.xml
+++ b/extensions-contrib/redis-cache/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/sqlserver-metadata-storage/pom.xml b/extensions-contrib/sqlserver-metadata-storage/pom.xml
index 67c78fbb81c6..388f40cb2955 100644
--- a/extensions-contrib/sqlserver-metadata-storage/pom.xml
+++ b/extensions-contrib/sqlserver-metadata-storage/pom.xml
@@ -28,7 +28,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-contrib/statsd-emitter/pom.xml b/extensions-contrib/statsd-emitter/pom.xml
index e4aad827e271..ea0f5ba231e9 100644
--- a/extensions-contrib/statsd-emitter/pom.xml
+++ b/extensions-contrib/statsd-emitter/pom.xml
@@ -21,7 +21,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/tdigestsketch/pom.xml b/extensions-contrib/tdigestsketch/pom.xml
index 7d271fb06708..76cf7b4055d0 100644
--- a/extensions-contrib/tdigestsketch/pom.xml
+++ b/extensions-contrib/tdigestsketch/pom.xml
@@ -22,7 +22,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/tdigestsketch/src/test/java/org/apache/druid/query/aggregation/tdigestsketch/sql/TDigestSketchSqlAggregatorTest.java b/extensions-contrib/tdigestsketch/src/test/java/org/apache/druid/query/aggregation/tdigestsketch/sql/TDigestSketchSqlAggregatorTest.java
index ae8c5bfe4683..b304dba196a3 100644
--- a/extensions-contrib/tdigestsketch/src/test/java/org/apache/druid/query/aggregation/tdigestsketch/sql/TDigestSketchSqlAggregatorTest.java
+++ b/extensions-contrib/tdigestsketch/src/test/java/org/apache/druid/query/aggregation/tdigestsketch/sql/TDigestSketchSqlAggregatorTest.java
@@ -19,11 +19,10 @@
package org.apache.druid.query.aggregation.tdigestsketch.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.math.expr.ExprMacroTable;
import org.apache.druid.query.Druids;
@@ -50,7 +49,6 @@
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
@@ -64,21 +62,18 @@
public class TDigestSketchSqlAggregatorTest extends BaseCalciteQueryTest
{
- private static final DruidOperatorTable OPERATOR_TABLE = new DruidOperatorTable(
- ImmutableSet.of(new TDigestSketchQuantileSqlAggregator(), new TDigestGenerateSketchSqlAggregator()),
- ImmutableSet.of()
- );
-
@Override
- public Iterable<? extends Module> getJacksonModules()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- return Iterables.concat(super.getJacksonModules(), new TDigestSketchModule().getJacksonModules());
+ super.configureGuice(builder);
+ builder.addModule(new TDigestSketchModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
TDigestSketchModule.registerSerde();
@@ -116,12 +111,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return OPERATOR_TABLE;
- }
-
@Test
public void testComputingSketchOnNumericValues()
{
diff --git a/extensions-contrib/thrift-extensions/pom.xml b/extensions-contrib/thrift-extensions/pom.xml
index 70aef1f61a93..5d61693a2868 100644
--- a/extensions-contrib/thrift-extensions/pom.xml
+++ b/extensions-contrib/thrift-extensions/pom.xml
@@ -28,7 +28,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/time-min-max/pom.xml b/extensions-contrib/time-min-max/pom.xml
index a11c79367930..d4767a94f30a 100644
--- a/extensions-contrib/time-min-max/pom.xml
+++ b/extensions-contrib/time-min-max/pom.xml
@@ -21,7 +21,7 @@
        <artifactId>druid</artifactId>
        <groupId>org.apache.druid</groupId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
    </parent>
    <modelVersion>4.0.0</modelVersion>
diff --git a/extensions-contrib/virtual-columns/pom.xml b/extensions-contrib/virtual-columns/pom.xml
index abdc8606e45d..7ae88be798cf 100644
--- a/extensions-contrib/virtual-columns/pom.xml
+++ b/extensions-contrib/virtual-columns/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-core/avro-extensions/pom.xml b/extensions-core/avro-extensions/pom.xml
index fcabcd7c9daa..53dff82a980c 100644
--- a/extensions-core/avro-extensions/pom.xml
+++ b/extensions-core/avro-extensions/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
@@ -254,6 +254,11 @@
            <artifactId>mockito-core</artifactId>
            <scope>test</scope>
        </dependency>
+        <dependency>
+            <groupId>org.hamcrest</groupId>
+            <artifactId>hamcrest-core</artifactId>
+            <scope>test</scope>
+        </dependency>
        <dependency>
            <groupId>org.apache.druid</groupId>
            <artifactId>druid-core</artifactId>
diff --git a/extensions-core/avro-extensions/src/main/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoder.java b/extensions-core/avro-extensions/src/main/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoder.java
index f7006cb02c21..05c5c9fec2fe 100644
--- a/extensions-core/avro-extensions/src/main/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoder.java
+++ b/extensions-core/avro-extensions/src/main/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoder.java
@@ -140,17 +140,17 @@ public GenericRecord parse(ByteBuffer bytes)
schema = parsedSchema instanceof AvroSchema ? ((AvroSchema) parsedSchema).rawSchema() : null;
}
catch (IOException | RestClientException ex) {
- throw new ParseException(null, "Failed to get Avro schema: %s", id);
+ throw new ParseException(null, ex, "Failed to fetch Avro schema from registry: %s", id);
}
if (schema == null) {
- throw new ParseException(null, "Failed to find Avro schema: %s", id);
+ throw new ParseException(null, "No Avro schema in registry: %s", id);
}
DatumReader<GenericRecord> reader = new GenericDatumReader<>(schema);
try {
return reader.read(null, DecoderFactory.get().binaryDecoder(bytes.array(), offset, length, null));
}
catch (Exception e) {
- throw new ParseException(null, e, "Fail to decode Avro message for schema: %s!", id);
+ throw new ParseException(null, e, "Failed to decode Avro message for schema: %s", id);
}
}
diff --git a/extensions-core/avro-extensions/src/test/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoderTest.java b/extensions-core/avro-extensions/src/test/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoderTest.java
index 9348e9486aef..7644b61bb106 100644
--- a/extensions-core/avro-extensions/src/test/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoderTest.java
+++ b/extensions-core/avro-extensions/src/test/java/org/apache/druid/data/input/avro/SchemaRegistryBasedAvroBytesDecoderTest.java
@@ -35,6 +35,8 @@
import org.apache.druid.jackson.DefaultObjectMapper;
import org.apache.druid.java.util.common.parsers.ParseException;
import org.apache.druid.utils.DynamicConfigProviderUtils;
+import org.hamcrest.CoreMatchers;
+import org.hamcrest.MatcherAssert;
import org.junit.Assert;
import org.junit.Before;
import org.junit.Test;
@@ -158,7 +160,7 @@ public void testParseWrongSchemaType() throws Exception
new SchemaRegistryBasedAvroBytesDecoder(registry).parse(bb);
}
- @Test(expected = ParseException.class)
+ @Test
public void testParseWrongId() throws Exception
{
// Given
@@ -166,7 +168,12 @@ public void testParseWrongId() throws Exception
ByteBuffer bb = ByteBuffer.allocate(5).put((byte) 0).putInt(1234);
bb.rewind();
// When
- new SchemaRegistryBasedAvroBytesDecoder(registry).parse(bb);
+ final ParseException e = Assert.assertThrows(
+ ParseException.class,
+ () -> new SchemaRegistryBasedAvroBytesDecoder(registry).parse(bb)
+ );
+ MatcherAssert.assertThat(e.getCause(), CoreMatchers.instanceOf(IOException.class));
+ MatcherAssert.assertThat(e.getCause().getMessage(), CoreMatchers.containsString("no pasaran"));
}
private byte[] getAvroDatum(Schema schema, GenericRecord someAvroDatum) throws IOException
diff --git a/extensions-core/azure-extensions/pom.xml b/extensions-core/azure-extensions/pom.xml
index 6a01cea8a316..e34bacbe69ef 100644
--- a/extensions-core/azure-extensions/pom.xml
+++ b/extensions-core/azure-extensions/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-core/datasketches/pom.xml b/extensions-core/datasketches/pom.xml
index a37efd2dc215..83101d2e7c01 100644
--- a/extensions-core/datasketches/pom.xml
+++ b/extensions-core/datasketches/pom.xml
@@ -29,7 +29,7 @@
        <groupId>org.apache.druid</groupId>
        <artifactId>druid</artifactId>
-        <version>25.0.0-SNAPSHOT</version>
+        <version>26.0.0-SNAPSHOT</version>
        <relativePath>../../pom.xml</relativePath>
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchMergeComplexMetricSerde.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchMergeComplexMetricSerde.java
index c8ac48ab186e..1063bbdfec1a 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchMergeComplexMetricSerde.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchMergeComplexMetricSerde.java
@@ -28,6 +28,7 @@
import org.apache.druid.segment.column.ColumnBuilder;
import org.apache.druid.segment.data.GenericIndexed;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
import org.apache.druid.segment.serde.ComplexColumnPartSupplier;
import org.apache.druid.segment.serde.ComplexMetricExtractor;
import org.apache.druid.segment.serde.ComplexMetricSerde;
@@ -70,7 +71,7 @@ public HllSketch extractValue(final InputRow inputRow, final String metricName)
if (object == null) {
return null;
}
- return deserializeSketch(object);
+ return deserializeSketchSafe(object);
}
};
}
@@ -98,6 +99,18 @@ static HllSketch deserializeSketch(final Object object)
throw new IAE("Object is not of a type that can be deserialized to an HllSketch:" + object.getClass().getName());
}
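+
+ // Like deserializeSketch above, but wraps the payload in SafeWritableMemory so a
+ // malformed value fails with an ordinary Java exception instead of an unsafe read.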
+ static HllSketch deserializeSketchSafe(final Object object)
+ {
+ if (object instanceof String) {
+ return HllSketch.wrap(SafeWritableMemory.wrap(StringUtils.decodeBase64(((String) object).getBytes(StandardCharsets.UTF_8))));
+ } else if (object instanceof byte[]) {
+ return HllSketch.wrap(SafeWritableMemory.wrap((byte[]) object));
+ } else if (object instanceof HllSketch) {
+ return (HllSketch) object;
+ }
+ throw new IAE("Object is not of a type that can be deserialized to an HllSketch:" + object.getClass().getName());
+ }
+
// support large columns
@Override
public GenericColumnSerializer getSerializer(final SegmentWriteOutMedium segmentWriteOutMedium, final String column)
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchModule.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchModule.java
index 5044068262d8..2a07c70ec639 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchModule.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchModule.java
@@ -44,7 +44,6 @@
*/
public class HllSketchModule implements DruidModule
{
-
public static final String TYPE_NAME = "HLLSketch"; // common type name to be associated with segment data
public static final String BUILD_TYPE_NAME = "HLLSketchBuild";
public static final String MERGE_TYPE_NAME = "HLLSketchMerge";
@@ -53,7 +52,6 @@ public class HllSketchModule implements DruidModule
public static final String ESTIMATE_WITH_BOUNDS_TYPE_NAME = "HLLSketchEstimateWithBounds";
public static final String ESTIMATE_TYPE_NAME = "HLLSketchEstimate";
-
@Override
public void configure(final Binder binder)
{
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategy.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategy.java
index 34145863fdf8..65257b22b796 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategy.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategy.java
@@ -22,7 +22,9 @@
import org.apache.datasketches.hll.HllSketch;
import org.apache.datasketches.memory.Memory;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
+import javax.annotation.Nullable;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
@@ -55,4 +57,12 @@ public byte[] toBytes(final HllSketch sketch)
return sketch.toCompactByteArray();
}
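+
+ // Bounds-checked read path for buffers whose contents may be corrupt; reads
+ // through the SafeWritableMemory region cannot stray past its limits.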
+ @Nullable
+ @Override
+ public HllSketch fromByteBufferSafe(ByteBuffer buffer, int numBytes)
+ {
+ return HllSketch.wrap(
+ SafeWritableMemory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerde.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerde.java
index 4c18a9785607..e5249853ac34 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerde.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerde.java
@@ -91,7 +91,7 @@ public Object extractValue(final InputRow inputRow, final String metricName)
if (object == null || object instanceof KllDoublesSketch || object instanceof Memory) {
return object;
}
- return KllDoublesSketchOperations.deserialize(object);
+ return KllDoublesSketchOperations.deserializeSafe(object);
}
};
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchObjectStrategy.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchObjectStrategy.java
index 97e670a625a5..17cb94e2fcf8 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchObjectStrategy.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchObjectStrategy.java
@@ -23,7 +23,9 @@
import org.apache.datasketches.kll.KllDoublesSketch;
import org.apache.datasketches.memory.Memory;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
+import javax.annotation.Nullable;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
@@ -60,4 +62,15 @@ public byte[] toBytes(final KllDoublesSketch sketch)
return sketch.toByteArray();
}
+ @Nullable
+ @Override
+ public KllDoublesSketch fromByteBufferSafe(ByteBuffer buffer, int numBytes)
+ {
+ if (numBytes == 0) {
+ return KllDoublesSketchOperations.EMPTY_SKETCH;
+ }
+ return KllDoublesSketch.wrap(
+ SafeWritableMemory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperations.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperations.java
index 57cb51747101..6da454d7f868 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperations.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperations.java
@@ -23,6 +23,7 @@
import org.apache.datasketches.memory.Memory;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.StringUtils;
+import org.apache.druid.segment.data.SafeWritableMemory;
import java.nio.charset.StandardCharsets;
@@ -46,6 +47,16 @@ public static KllDoublesSketch deserialize(final Object serializedSketch)
);
}
+ public static KllDoublesSketch deserializeSafe(final Object serializedSketch)
+ {
+ if (serializedSketch instanceof String) {
+ return deserializeFromBase64EncodedStringSafe((String) serializedSketch);
+ } else if (serializedSketch instanceof byte[]) {
+ return deserializeFromByteArraySafe((byte[]) serializedSketch);
+ }
+ return deserialize(serializedSketch);
+ }
+
public static KllDoublesSketch deserializeFromBase64EncodedString(final String str)
{
return deserializeFromByteArray(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
@@ -56,4 +67,14 @@ public static KllDoublesSketch deserializeFromByteArray(final byte[] data)
return KllDoublesSketch.wrap(Memory.wrap(data));
}
+ public static KllDoublesSketch deserializeFromBase64EncodedStringSafe(final String str)
+ {
+ return deserializeFromByteArraySafe(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
+ }
+
+ public static KllDoublesSketch deserializeFromByteArraySafe(final byte[] data)
+ {
+ return KllDoublesSketch.wrap(SafeWritableMemory.wrap(data));
+ }
+
}
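The safe variants above differ from the existing methods only in the Memory implementation they wrap. A minimal illustration of the distinction, assuming the datasketches-java and Druid classes referenced in this patch (the example class name, helper methods, and sample values are illustrative, not part of the patch):

import org.apache.datasketches.kll.KllDoublesSketch;
import org.apache.datasketches.memory.Memory;
import org.apache.druid.segment.data.SafeWritableMemory;

public class SafeWrapExample
{
  // Untrusted bytes (e.g. decoded from an ingestion spec): SafeWritableMemory is
  // backed by an ordinary ByteBuffer, so a malformed sketch fails with a Java
  // exception instead of an out-of-bounds unsafe read.
  static KllDoublesSketch fromUntrustedBytes(byte[] data)
  {
    return KllDoublesSketch.wrap(SafeWritableMemory.wrap(data));
  }

  // Bytes Druid itself wrote and validated: plain Memory.wrap keeps the faster
  // direct reads.
  static KllDoublesSketch fromTrustedBytes(byte[] data)
  {
    return KllDoublesSketch.wrap(Memory.wrap(data));
  }

  public static void main(String[] args)
  {
    KllDoublesSketch sketch = KllDoublesSketch.newHeapInstance();
    sketch.update(1.0);
    sketch.update(2.0);
    byte[] bytes = sketch.toByteArray();
    System.out.println(fromUntrustedBytes(bytes).getN()); // prints 2
  }
}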
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerde.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerde.java
index 4a71befe0c66..175b307ec33e 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerde.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerde.java
@@ -91,7 +91,7 @@ public Object extractValue(final InputRow inputRow, final String metricName)
if (object == null || object instanceof KllFloatsSketch || object instanceof Memory) {
return object;
}
- return KllFloatsSketchOperations.deserialize(object);
+ return KllFloatsSketchOperations.deserializeSafe(object);
}
};
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchObjectStrategy.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchObjectStrategy.java
index ff177a2f54f1..93ff0a7dba52 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchObjectStrategy.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchObjectStrategy.java
@@ -23,7 +23,9 @@
import org.apache.datasketches.kll.KllFloatsSketch;
import org.apache.datasketches.memory.Memory;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
+import javax.annotation.Nullable;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
@@ -60,4 +62,15 @@ public byte[] toBytes(final KllFloatsSketch sketch)
return sketch.toByteArray();
}
+ @Nullable
+ @Override
+ public KllFloatsSketch fromByteBufferSafe(ByteBuffer buffer, int numBytes)
+ {
+ if (numBytes == 0) {
+ return KllFloatsSketchOperations.EMPTY_SKETCH;
+ }
+ return KllFloatsSketch.wrap(
+ SafeWritableMemory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperations.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperations.java
index e32b67b2549a..02fb615da4dc 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperations.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperations.java
@@ -23,6 +23,7 @@
import org.apache.datasketches.memory.Memory;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.StringUtils;
+import org.apache.druid.segment.data.SafeWritableMemory;
import java.nio.charset.StandardCharsets;
@@ -46,6 +47,16 @@ public static KllFloatsSketch deserialize(final Object serializedSketch)
);
}
+ public static KllFloatsSketch deserializeSafe(final Object serializedSketch)
+ {
+ if (serializedSketch instanceof String) {
+ return deserializeFromBase64EncodedStringSafe((String) serializedSketch);
+ } else if (serializedSketch instanceof byte[]) {
+ return deserializeFromByteArraySafe((byte[]) serializedSketch);
+ }
+ return deserialize(serializedSketch);
+ }
+
public static KllFloatsSketch deserializeFromBase64EncodedString(final String str)
{
return deserializeFromByteArray(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
@@ -56,4 +67,14 @@ public static KllFloatsSketch deserializeFromByteArray(final byte[] data)
return KllFloatsSketch.wrap(Memory.wrap(data));
}
+ public static KllFloatsSketch deserializeFromBase64EncodedStringSafe(final String str)
+ {
+ return deserializeFromByteArraySafe(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
+ }
+
+ public static KllFloatsSketch deserializeFromByteArraySafe(final byte[] data)
+ {
+ return KllFloatsSketch.wrap(SafeWritableMemory.wrap(data));
+ }
+
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerde.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerde.java
index d97b5f8c6dd3..3614f214c708 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerde.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerde.java
@@ -92,7 +92,7 @@ public Object extractValue(final InputRow inputRow, final String metricName)
if (object == null || object instanceof DoublesSketch || object instanceof Memory) {
return object;
}
- return DoublesSketchOperations.deserialize(object);
+ return DoublesSketchOperations.deserializeSafe(object);
}
};
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchModule.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchModule.java
index cd047695f45d..7896e1c55c10 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchModule.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchModule.java
@@ -43,7 +43,6 @@
public class DoublesSketchModule implements DruidModule
{
-
public static final String DOUBLES_SKETCH = "quantilesDoublesSketch";
public static final String DOUBLES_SKETCH_MERGE = "quantilesDoublesSketchMerge";
public static final ColumnType TYPE = ColumnType.ofComplex(DOUBLES_SKETCH);
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchObjectStrategy.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchObjectStrategy.java
index 826de9378f8c..569b60bf03f7 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchObjectStrategy.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchObjectStrategy.java
@@ -23,7 +23,9 @@
import org.apache.datasketches.memory.Memory;
import org.apache.datasketches.quantiles.DoublesSketch;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
+import javax.annotation.Nullable;
import java.nio.ByteBuffer;
import java.nio.ByteOrder;
@@ -60,4 +62,15 @@ public byte[] toBytes(final DoublesSketch sketch)
return sketch.toByteArray(true);
}
+ @Nullable
+ @Override
+ public DoublesSketch fromByteBufferSafe(ByteBuffer buffer, int numBytes)
+ {
+ if (numBytes == 0) {
+ return DoublesSketchOperations.EMPTY_SKETCH;
+ }
+ return DoublesSketch.wrap(
+ SafeWritableMemory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperations.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperations.java
index e30fb9bdae83..a2ca197c11ac 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperations.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperations.java
@@ -23,6 +23,7 @@
import org.apache.datasketches.quantiles.DoublesSketch;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.StringUtils;
+import org.apache.druid.segment.data.SafeWritableMemory;
import java.nio.charset.StandardCharsets;
@@ -46,6 +47,16 @@ public static DoublesSketch deserialize(final Object serializedSketch)
);
}
+ public static DoublesSketch deserializeSafe(final Object serializedSketch)
+ {
+ if (serializedSketch instanceof String) {
+ return deserializeFromBase64EncodedStringSafe((String) serializedSketch);
+ } else if (serializedSketch instanceof byte[]) {
+ return deserializeFromByteArraySafe((byte[]) serializedSketch);
+ }
+ return deserialize(serializedSketch);
+ }
+
public static DoublesSketch deserializeFromBase64EncodedString(final String str)
{
return deserializeFromByteArray(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
@@ -56,4 +67,13 @@ public static DoublesSketch deserializeFromByteArray(final byte[] data)
return DoublesSketch.wrap(Memory.wrap(data));
}
+ public static DoublesSketch deserializeFromBase64EncodedStringSafe(final String str)
+ {
+ return deserializeFromByteArraySafe(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
+ }
+
+ public static DoublesSketch deserializeFromByteArraySafe(final byte[] data)
+ {
+ return DoublesSketch.wrap(SafeWritableMemory.wrap(data));
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchConstantPostAggregator.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchConstantPostAggregator.java
index b3541bd50649..64c182a0d62a 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchConstantPostAggregator.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchConstantPostAggregator.java
@@ -51,7 +51,7 @@ public SketchConstantPostAggregator(@JsonProperty("name") String name, @JsonProp
Preconditions.checkArgument(value != null && !value.isEmpty(),
"Constant value cannot be null or empty, expecting base64 encoded sketch string");
this.value = value;
- this.sketchValue = SketchHolder.deserialize(value);
+ this.sketchValue = SketchHolder.deserializeSafe(value);
}
@Override
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolder.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolder.java
index 59ca453bb25a..838b4ae91f0f 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolder.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolder.java
@@ -34,6 +34,7 @@
import org.apache.druid.java.util.common.IAE;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.StringUtils;
+import org.apache.druid.segment.data.SafeWritableMemory;
import javax.annotation.Nullable;
@@ -224,6 +225,17 @@ public static SketchHolder deserialize(Object serializedSketch)
);
}
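+
+ /**
+ * Like {@link #deserialize}, but base64 strings and byte arrays are wrapped in bounds-checked
+ * {@link SafeWritableMemory} so malformed input fails with a regular Java buffer exception.
+ */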
+ public static SketchHolder deserializeSafe(Object serializedSketch)
+ {
+ if (serializedSketch instanceof String) {
+ return SketchHolder.of(deserializeFromBase64EncodedStringSafe((String) serializedSketch));
+ } else if (serializedSketch instanceof byte[]) {
+ return SketchHolder.of(deserializeFromByteArraySafe((byte[]) serializedSketch));
+ }
+
+ return deserialize(serializedSketch);
+ }
+
private static Sketch deserializeFromBase64EncodedString(String str)
{
return deserializeFromByteArray(StringUtils.decodeBase64(StringUtils.toUtf8(str)));
@@ -234,6 +246,16 @@ private static Sketch deserializeFromByteArray(byte[] data)
return deserializeFromMemory(Memory.wrap(data));
}
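+
+ /** Safe variant of {@link #deserializeFromBase64EncodedString} backed by bounds-checked memory. */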
+ private static Sketch deserializeFromBase64EncodedStringSafe(String str)
+ {
+ return deserializeFromByteArraySafe(StringUtils.decodeBase64(StringUtils.toUtf8(str)));
+ }
+
+ private static Sketch deserializeFromByteArraySafe(byte[] data)
+ {
+ return deserializeFromMemory(SafeWritableMemory.wrap(data));
+ }
+
private static Sketch deserializeFromMemory(Memory mem)
{
if (Sketch.getSerializationVersion(mem) < 3) {
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategy.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategy.java
index e98bc3d95a04..96fafe826211 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategy.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategy.java
@@ -23,6 +23,7 @@
import org.apache.datasketches.memory.Memory;
import org.apache.datasketches.theta.Sketch;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
import javax.annotation.Nullable;
import java.nio.ByteBuffer;
@@ -66,4 +67,17 @@ public byte[] toBytes(@Nullable SketchHolder obj)
return ByteArrays.EMPTY_ARRAY;
}
}
+
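+ /**
+ * Reads a sketch using {@link SafeWritableMemory}, which bounds-checks every access so corrupt or truncated
+ * input fails with a regular Java buffer exception instead of an unchecked out-of-bounds memory read.
+ */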
+ @Nullable
+ @Override
+ public SketchHolder fromByteBufferSafe(ByteBuffer buffer, int numBytes)
+ {
+ if (numBytes == 0) {
+ return SketchHolder.EMPTY;
+ }
+
+ return SketchHolder.of(
+ SafeWritableMemory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchMergeComplexMetricSerde.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchMergeComplexMetricSerde.java
index a824312c0ef7..4f3ecfae2915 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchMergeComplexMetricSerde.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/SketchMergeComplexMetricSerde.java
@@ -59,7 +59,7 @@ public Class<SketchHolder> extractedClass()
public SketchHolder extractValue(InputRow inputRow, String metricName)
{
final Object object = inputRow.getRaw(metricName);
- return object == null ? null : SketchHolder.deserialize(object);
+ return object == null ? null : SketchHolder.deserializeSafe(object);
}
};
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSetBaseOperatorConversion.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSetBaseOperatorConversion.java
index 0afad6cbe6b1..62c686cd2b2a 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSetBaseOperatorConversion.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSetBaseOperatorConversion.java
@@ -63,6 +63,8 @@ public DruidExpression toDruidExpression(
RexNode rexNode
)
{
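+ // This operator is only valid over sketch aggregates, so planning fails here; record a planning error so
+ // the user sees why (exercised by testThetaSketchIntersectOnScalarExpression).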
+ plannerContext.setPlanningError("%s can only be used on aggregates. " +
+ "It cannot be used directly on a column or on a scalar expression.", getFunctionName());
return null;
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchMergeComplexMetricSerde.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchMergeComplexMetricSerde.java
index 19c8da292b4e..028bcdc35491 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchMergeComplexMetricSerde.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchMergeComplexMetricSerde.java
@@ -60,7 +60,7 @@ public Object extractValue(final InputRow inputRow, final String metricName)
if (object == null || object instanceof ArrayOfDoublesSketch) {
return object;
}
- return ArrayOfDoublesSketchOperations.deserialize(object);
+ return ArrayOfDoublesSketchOperations.deserializeSafe(object);
}
};
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategy.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategy.java
index 1ae950e068f8..f893c83b5707 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategy.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategy.java
@@ -23,6 +23,7 @@
import org.apache.datasketches.tuple.arrayofdoubles.ArrayOfDoublesSketch;
import org.apache.datasketches.tuple.arrayofdoubles.ArrayOfDoublesSketches;
import org.apache.druid.segment.data.ObjectStrategy;
+import org.apache.druid.segment.data.SafeWritableMemory;
import javax.annotation.Nullable;
import java.nio.ByteBuffer;
@@ -48,7 +49,9 @@ public Class<? extends ArrayOfDoublesSketch> getClazz()
@Override
public ArrayOfDoublesSketch fromByteBuffer(final ByteBuffer buffer, final int numBytes)
{
- return ArrayOfDoublesSketches.wrapSketch(Memory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes));
+ return ArrayOfDoublesSketches.wrapSketch(
+ Memory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
}
@Override
@@ -61,4 +64,12 @@ public byte[] toBytes(@Nullable final ArrayOfDoublesSketch sketch)
return sketch.toByteArray();
}
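+
+ /**
+ * Reads a sketch using {@link SafeWritableMemory}, which bounds-checks every access so corrupt or truncated
+ * input fails with a regular Java buffer exception instead of an unchecked out-of-bounds memory read.
+ */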
+ @Nullable
+ @Override
+ public ArrayOfDoublesSketch fromByteBufferSafe(ByteBuffer buffer, int numBytes)
+ {
+ return ArrayOfDoublesSketches.wrapSketch(
+ SafeWritableMemory.wrap(buffer, ByteOrder.LITTLE_ENDIAN).region(buffer.position(), numBytes)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperations.java b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperations.java
index b1658a995714..2768858ffe32 100644
--- a/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperations.java
+++ b/extensions-core/datasketches/src/main/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperations.java
@@ -30,6 +30,7 @@
import org.apache.druid.java.util.common.IAE;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.StringUtils;
+import org.apache.druid.segment.data.SafeWritableMemory;
import java.nio.charset.StandardCharsets;
@@ -115,6 +116,17 @@ public static ArrayOfDoublesSketch deserialize(final Object serializedSketch)
throw new ISE("Object is not of a type that can deserialize to sketch: %s", serializedSketch.getClass());
}
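+
+ /**
+ * Like {@link #deserialize}, but base64 strings and byte arrays are wrapped in bounds-checked
+ * {@link SafeWritableMemory} so malformed input fails with a regular Java buffer exception.
+ */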
+ public static ArrayOfDoublesSketch deserializeSafe(final Object serializedSketch)
+ {
+ if (serializedSketch instanceof String) {
+ return deserializeFromBase64EncodedStringSafe((String) serializedSketch);
+ } else if (serializedSketch instanceof byte[]) {
+ return deserializeFromByteArraySafe((byte[]) serializedSketch);
+ }
+
+ return deserialize(serializedSketch);
+ }
+
public static ArrayOfDoublesSketch deserializeFromBase64EncodedString(final String str)
{
return deserializeFromByteArray(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
@@ -122,8 +134,16 @@ public static ArrayOfDoublesSketch deserializeFromBase64EncodedString(final Stri
public static ArrayOfDoublesSketch deserializeFromByteArray(final byte[] data)
{
- final Memory mem = Memory.wrap(data);
- return ArrayOfDoublesSketches.wrapSketch(mem);
+ return ArrayOfDoublesSketches.wrapSketch(Memory.wrap(data));
+ }
+
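+ /** Safe variant of {@link #deserializeFromBase64EncodedString} backed by bounds-checked memory. */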
+ public static ArrayOfDoublesSketch deserializeFromBase64EncodedStringSafe(final String str)
+ {
+ return deserializeFromByteArraySafe(StringUtils.decodeBase64(str.getBytes(StandardCharsets.UTF_8)));
}
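+
+ /** Safe variant of {@link #deserializeFromByteArray} backed by bounds-checked memory. */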
+ public static ArrayOfDoublesSketch deserializeFromByteArraySafe(final byte[] data)
+ {
+ return ArrayOfDoublesSketches.wrapSketch(SafeWritableMemory.wrap(data));
+ }
}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategyTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategyTest.java
new file mode 100644
index 000000000000..ff1eb947408e
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/HllSketchObjectStrategyTest.java
@@ -0,0 +1,77 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.hll;
+
+import org.apache.datasketches.SketchesArgumentException;
+import org.apache.datasketches.hll.HllSketch;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
+public class HllSketchObjectStrategyTest
+{
+ @Test
+ public void testSafeRead()
+ {
+ HllSketch sketch = new HllSketch();
+ sketch.update(new int[]{1, 2, 3});
+
+ final byte[] bytes = sketch.toCompactByteArray();
+
+ ByteBuffer buf = ByteBuffer.wrap(bytes).order(ByteOrder.LITTLE_ENDIAN);
+ HllSketchObjectStrategy objectStrategy = new HllSketchObjectStrategy();
+
+ // a valid sketch should not throw when copied, since copying reads the backing memory
+ objectStrategy.fromByteBufferSafe(buf, bytes.length).copy();
+
+ // a corrupted sketch should fail with a regular Java buffer exception
+ for (int subset = 3; subset < bytes.length - 1; subset++) {
+ final byte[] garbage2 = new byte[subset];
+ for (int i = 0; i < garbage2.length; i++) {
+ garbage2[i] = buf.get(i);
+ }
+
+ final ByteBuffer buf2 = ByteBuffer.wrap(garbage2).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf2, garbage2.length).copy()
+ );
+ }
+
+ // a non-sketch too short to contain a header should fail with a regular Java buffer exception
+ final byte[] garbage = new byte[]{0x01, 0x02};
+ final ByteBuffer buf3 = ByteBuffer.wrap(garbage).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf3, garbage.length).copy()
+ );
+
+ // a non-sketch long enough to be checked fails the sketch library's own validation (this one doesn't actually need the 'safe' read)
+ final byte[] garbageLonger = StringUtils.toUtf8("notasketch");
+ final ByteBuffer buf4 = ByteBuffer.wrap(garbageLonger).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ SketchesArgumentException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf4, garbageLonger.length).copy()
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/sql/HllSketchSqlAggregatorTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/sql/HllSketchSqlAggregatorTest.java
index 86e76ca8c219..aa0e9afd13a1 100644
--- a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/sql/HllSketchSqlAggregatorTest.java
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/hll/sql/HllSketchSqlAggregatorTest.java
@@ -19,12 +19,11 @@
package org.apache.druid.query.aggregation.datasketches.hll.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.StringUtils;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.java.util.common.granularity.PeriodGranularity;
@@ -61,13 +60,11 @@
import org.apache.druid.segment.virtual.ExpressionVirtualColumn;
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
-import org.apache.druid.sql.calcite.aggregation.ApproxCountDistinctSqlAggregator;
-import org.apache.druid.sql.calcite.aggregation.builtin.CountSqlAggregator;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
+import org.apache.druid.sql.guice.SqlModule;
import org.apache.druid.timeline.DataSegment;
import org.apache.druid.timeline.partition.LinearShardSpec;
import org.joda.time.DateTimeZone;
@@ -78,22 +75,34 @@
import java.util.Arrays;
import java.util.Collections;
import java.util.List;
+import java.util.Properties;
public class HllSketchSqlAggregatorTest extends BaseCalciteQueryTest
{
private static final boolean ROUND = true;
@Override
- public Iterable<? extends Module> getJacksonModules()
+ public void gatherProperties(Properties properties)
{
- return Iterables.concat(super.getJacksonModules(), new HllSketchModule().getJacksonModules());
+ super.gatherProperties(properties);
+
+ // Use APPROX_COUNT_DISTINCT_DS_HLL as APPROX_COUNT_DISTINCT impl for these tests.
+ properties.put(SqlModule.PROPERTY_SQL_APPROX_COUNT_DISTINCT_CHOICE, HllSketchApproxCountDistinctSqlAggregator.NAME);
+ }
+
+ @Override
+ public void configureGuice(DruidInjectorBuilder builder)
+ {
+ super.configureGuice(builder);
+ builder.addModule(new HllSketchModule());
}
@SuppressWarnings("resource")
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
HllSketchModule.registerSerde();
@@ -132,30 +141,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- final HllSketchApproxCountDistinctSqlAggregator approxCountDistinctSqlAggregator =
- new HllSketchApproxCountDistinctSqlAggregator();
-
- return new DruidOperatorTable(
- ImmutableSet.of(
- approxCountDistinctSqlAggregator,
- new HllSketchObjectSqlAggregator(),
-
- // Use APPROX_COUNT_DISTINCT_DS_HLL as APPROX_COUNT_DISTINCT impl for these tests.
- new CountSqlAggregator(new ApproxCountDistinctSqlAggregator(approxCountDistinctSqlAggregator)),
- new ApproxCountDistinctSqlAggregator(approxCountDistinctSqlAggregator)
- ),
- ImmutableSet.of(
- new HllSketchSetUnionOperatorConversion(),
- new HllSketchEstimateOperatorConversion(),
- new HllSketchToStringOperatorConversion(),
- new HllSketchEstimateWithErrorBoundsOperatorConversion()
- )
- );
- }
-
@Test
public void testApproxCountDistinctHllSketch()
{
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerdeTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerdeTest.java
index 3628c5e6212f..0ae46bef496b 100644
--- a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerdeTest.java
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchComplexMetricSerdeTest.java
@@ -23,10 +23,14 @@
import com.google.common.collect.ImmutableMap;
import org.apache.datasketches.kll.KllDoublesSketch;
import org.apache.druid.data.input.MapBasedInputRow;
+import org.apache.druid.segment.data.ObjectStrategy;
import org.apache.druid.segment.serde.ComplexMetricExtractor;
import org.junit.Assert;
import org.junit.Test;
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
public class KllDoublesSketchComplexMetricSerdeTest
{
@Test
@@ -92,4 +96,44 @@ public void testExtractorOnLeadingDecimalNumber()
Assert.assertEquals(1, sketch.getNumRetained());
Assert.assertEquals(0.1d, sketch.getMaxValue(), 0.01d);
}
+
+ @Test
+ public void testSafeRead()
+ {
+ final KllDoublesSketchComplexMetricSerde serde = new KllDoublesSketchComplexMetricSerde();
+ final ObjectStrategy<KllDoublesSketch> objectStrategy = serde.getObjectStrategy();
+
+ KllDoublesSketch sketch = KllDoublesSketch.newHeapInstance();
+ sketch.update(1.1);
+ sketch.update(1.2);
+ final byte[] bytes = sketch.toByteArray();
+
+ ByteBuffer buf = ByteBuffer.wrap(bytes).order(ByteOrder.LITTLE_ENDIAN);
+
+ // a valid sketch should not throw when converted to a byte array, since that reads the backing memory
+ objectStrategy.fromByteBufferSafe(buf, bytes.length).toByteArray();
+
+ // a corrupted sketch should fail with a regular Java buffer exception; not every truncated length fails with
+ // an IndexOutOfBoundsException, but at least this many do
+ for (int subset = 3; subset < 24; subset++) {
+ final byte[] garbage2 = new byte[subset];
+ for (int i = 0; i < garbage2.length; i++) {
+ garbage2[i] = buf.get(i);
+ }
+
+ final ByteBuffer buf2 = ByteBuffer.wrap(garbage2).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf2, garbage2.length).toByteArray()
+ );
+ }
+
+ // a non-sketch too short to contain a header should fail with a regular Java buffer exception
+ final byte[] garbage = new byte[]{0x01, 0x02};
+ final ByteBuffer buf3 = ByteBuffer.wrap(garbage).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf3, garbage.length).toByteArray()
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperationsTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperationsTest.java
new file mode 100644
index 000000000000..d2b0e3839848
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllDoublesSketchOperationsTest.java
@@ -0,0 +1,51 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.kll;
+
+import org.apache.datasketches.kll.KllDoublesSketch;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.util.Arrays;
+
+public class KllDoublesSketchOperationsTest
+{
+ @Test
+ public void testDeserializeSafe()
+ {
+ KllDoublesSketch sketch = KllDoublesSketch.newHeapInstance();
+ sketch.update(1.1);
+ sketch.update(1.2);
+ final byte[] bytes = sketch.toByteArray();
+ final String base64 = StringUtils.encodeBase64String(bytes);
+
+ Assert.assertArrayEquals(bytes, KllDoublesSketchOperations.deserializeSafe(sketch).toByteArray());
+ Assert.assertArrayEquals(bytes, KllDoublesSketchOperations.deserializeSafe(bytes).toByteArray());
+ Assert.assertArrayEquals(bytes, KllDoublesSketchOperations.deserializeSafe(base64).toByteArray());
+
+ final byte[] truncated = Arrays.copyOfRange(bytes, 0, 20);
+ Assert.assertThrows(IndexOutOfBoundsException.class, () -> KllDoublesSketchOperations.deserializeSafe(truncated));
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> KllDoublesSketchOperations.deserializeSafe(StringUtils.encodeBase64String(truncated))
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerdeTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerdeTest.java
index 5ff441df1c14..c6b8c310221c 100644
--- a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerdeTest.java
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchComplexMetricSerdeTest.java
@@ -23,10 +23,14 @@
import com.google.common.collect.ImmutableMap;
import org.apache.datasketches.kll.KllFloatsSketch;
import org.apache.druid.data.input.MapBasedInputRow;
+import org.apache.druid.segment.data.ObjectStrategy;
import org.apache.druid.segment.serde.ComplexMetricExtractor;
import org.junit.Assert;
import org.junit.Test;
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
public class KllFloatsSketchComplexMetricSerdeTest
{
@Test
@@ -92,4 +96,44 @@ public void testExtractorOnLeadingDecimalNumber()
Assert.assertEquals(1, sketch.getNumRetained());
Assert.assertEquals(0.1d, sketch.getMaxValue(), 0.01d);
}
+
+ @Test
+ public void testSafeRead()
+ {
+ final KllFloatsSketchComplexMetricSerde serde = new KllFloatsSketchComplexMetricSerde();
+ final ObjectStrategy<KllFloatsSketch> objectStrategy = serde.getObjectStrategy();
+
+ KllFloatsSketch sketch = KllFloatsSketch.newHeapInstance();
+ sketch.update(1.1f);
+ sketch.update(1.2f);
+ final byte[] bytes = sketch.toByteArray();
+
+ ByteBuffer buf = ByteBuffer.wrap(bytes).order(ByteOrder.LITTLE_ENDIAN);
+
+ // a valid sketch should not throw when converted to a byte array, since that reads the backing memory
+ objectStrategy.fromByteBufferSafe(buf, bytes.length).toByteArray();
+
+ // a corrupted sketch should fail with a regular Java buffer exception; not every truncated length fails with
+ // an IndexOutOfBoundsException, but at least this many do
+ for (int subset = 3; subset < 24; subset++) {
+ final byte[] garbage2 = new byte[subset];
+ for (int i = 0; i < garbage2.length; i++) {
+ garbage2[i] = buf.get(i);
+ }
+
+ final ByteBuffer buf2 = ByteBuffer.wrap(garbage2).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf2, garbage2.length).toByteArray()
+ );
+ }
+
+ // a non-sketch too short to contain a header should fail with a regular Java buffer exception
+ final byte[] garbage = new byte[]{0x01, 0x02};
+ final ByteBuffer buf3 = ByteBuffer.wrap(garbage).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf3, garbage.length).toByteArray()
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperationsTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperationsTest.java
new file mode 100644
index 000000000000..613b38c6601a
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/kll/KllFloatsSketchOperationsTest.java
@@ -0,0 +1,51 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.kll;
+
+import org.apache.datasketches.kll.KllFloatsSketch;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.util.Arrays;
+
+public class KllFloatsSketchOperationsTest
+{
+ @Test
+ public void testDeserializeSafe()
+ {
+ KllFloatsSketch sketch = KllFloatsSketch.newHeapInstance();
+ sketch.update(1.1f);
+ sketch.update(1.2f);
+ final byte[] bytes = sketch.toByteArray();
+ final String base64 = StringUtils.encodeBase64String(bytes);
+
+ Assert.assertArrayEquals(bytes, KllFloatsSketchOperations.deserializeSafe(sketch).toByteArray());
+ Assert.assertArrayEquals(bytes, KllFloatsSketchOperations.deserializeSafe(bytes).toByteArray());
+ Assert.assertArrayEquals(bytes, KllFloatsSketchOperations.deserializeSafe(base64).toByteArray());
+
+ final byte[] truncated = Arrays.copyOfRange(bytes, 0, 20);
+ Assert.assertThrows(IndexOutOfBoundsException.class, () -> KllFloatsSketchOperations.deserializeSafe(truncated));
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> KllFloatsSketchOperations.deserializeSafe(StringUtils.encodeBase64String(truncated))
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerdeTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerdeTest.java
index e198c7704257..7dc82baee925 100644
--- a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerdeTest.java
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchComplexMetricSerdeTest.java
@@ -22,11 +22,16 @@
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import org.apache.datasketches.quantiles.DoublesSketch;
+import org.apache.datasketches.quantiles.DoublesUnion;
import org.apache.druid.data.input.MapBasedInputRow;
+import org.apache.druid.segment.data.ObjectStrategy;
import org.apache.druid.segment.serde.ComplexMetricExtractor;
import org.junit.Assert;
import org.junit.Test;
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
public class DoublesSketchComplexMetricSerdeTest
{
@Test
@@ -92,4 +97,42 @@ public void testExtractorOnLeadingDecimalNumber()
Assert.assertEquals(1, sketch.getRetainedItems());
Assert.assertEquals(0.1d, sketch.getMaxValue(), 0.01d);
}
+
+ @Test
+ public void testSafeRead()
+ {
+ final DoublesSketchComplexMetricSerde serde = new DoublesSketchComplexMetricSerde();
+ DoublesUnion union = DoublesUnion.builder().setMaxK(1024).build();
+ union.update(1.1);
+ final byte[] bytes = union.toByteArray();
+
+ ByteBuffer buf = ByteBuffer.wrap(bytes).order(ByteOrder.LITTLE_ENDIAN);
+ ObjectStrategy<DoublesSketch> objectStrategy = serde.getObjectStrategy();
+
+ // a valid sketch should not throw when serialized, since serialization reads the backing memory
+ objectStrategy.fromByteBufferSafe(buf, bytes.length).toByteArray(true);
+
+ // a corrupted sketch should fail with a regular Java buffer exception
+ for (int subset = 3; subset < 15; subset++) {
+ final byte[] garbage2 = new byte[subset];
+ for (int i = 0; i < garbage2.length; i++) {
+ garbage2[i] = buf.get(i);
+ }
+
+ final ByteBuffer buf2 = ByteBuffer.wrap(garbage2).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ "i " + subset,
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf2, garbage2.length).toByteArray(true)
+ );
+ }
+
+ // a non-sketch too short to contain a header should fail with a regular Java buffer exception
+ final byte[] garbage = new byte[]{0x01, 0x02};
+ final ByteBuffer buf3 = ByteBuffer.wrap(garbage).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf3, garbage.length).toByteArray(true)
+ );
+ }
}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperationsTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperationsTest.java
new file mode 100644
index 000000000000..38e5d39a91b8
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/DoublesSketchOperationsTest.java
@@ -0,0 +1,50 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.quantiles;
+
+import org.apache.datasketches.quantiles.DoublesUnion;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.util.Arrays;
+
+public class DoublesSketchOperationsTest
+{
+ @Test
+ public void testDeserializeSafe()
+ {
+ DoublesUnion union = DoublesUnion.builder().setMaxK(1024).build();
+ union.update(1.1);
+ final byte[] bytes = union.getResult().toByteArray();
+ final String base64 = StringUtils.encodeBase64String(bytes);
+
+ Assert.assertArrayEquals(bytes, DoublesSketchOperations.deserializeSafe(union.getResult()).toByteArray());
+ Assert.assertArrayEquals(bytes, DoublesSketchOperations.deserializeSafe(bytes).toByteArray());
+ Assert.assertArrayEquals(bytes, DoublesSketchOperations.deserializeSafe(base64).toByteArray());
+
+ final byte[] truncated = Arrays.copyOfRange(bytes, 0, 4);
+ Assert.assertThrows(IndexOutOfBoundsException.class, () -> DoublesSketchOperations.deserializeSafe(truncated));
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> DoublesSketchOperations.deserializeSafe(StringUtils.encodeBase64String(truncated))
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/sql/DoublesSketchSqlAggregatorTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/sql/DoublesSketchSqlAggregatorTest.java
index e4a66a9a56c8..f2253462bd01 100644
--- a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/sql/DoublesSketchSqlAggregatorTest.java
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/quantiles/sql/DoublesSketchSqlAggregatorTest.java
@@ -19,12 +19,11 @@
package org.apache.druid.query.aggregation.datasketches.quantiles.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.math.expr.ExprMacroTable;
import org.apache.druid.query.Druids;
@@ -63,7 +62,6 @@
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
@@ -79,31 +77,18 @@
public class DoublesSketchSqlAggregatorTest extends BaseCalciteQueryTest
{
- private static final DruidOperatorTable OPERATOR_TABLE = new DruidOperatorTable(
- ImmutableSet.of(
- new DoublesSketchApproxQuantileSqlAggregator(),
- new DoublesSketchObjectSqlAggregator()
- ),
- ImmutableSet.of(
- new DoublesSketchQuantileOperatorConversion(),
- new DoublesSketchQuantilesOperatorConversion(),
- new DoublesSketchToHistogramOperatorConversion(),
- new DoublesSketchRankOperatorConversion(),
- new DoublesSketchCDFOperatorConversion(),
- new DoublesSketchSummaryOperatorConversion()
- )
- );
-
@Override
- public Iterable<? extends Module> getJacksonModules()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- return Iterables.concat(super.getJacksonModules(), new DoublesSketchModule().getJacksonModules());
+ super.configureGuice(builder);
+ builder.addModule(new DoublesSketchModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
DoublesSketchModule.registerSerde();
@@ -141,12 +126,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return OPERATOR_TABLE;
- }
-
@Test
public void testQuantileOnFloatAndLongs()
{
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategyTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategyTest.java
new file mode 100644
index 000000000000..5619facd5f62
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderObjectStrategyTest.java
@@ -0,0 +1,79 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.theta;
+
+import org.apache.datasketches.Family;
+import org.apache.datasketches.SketchesArgumentException;
+import org.apache.datasketches.theta.SetOperation;
+import org.apache.datasketches.theta.Union;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
+public class SketchHolderObjectStrategyTest
+{
+ @Test
+ public void testSafeRead()
+ {
+ SketchHolderObjectStrategy objectStrategy = new SketchHolderObjectStrategy();
+ Union union = (Union) SetOperation.builder().setNominalEntries(1024).build(Family.UNION);
+ union.update(1234L);
+
+ final byte[] bytes = union.getResult().toByteArray();
+
+ ByteBuffer buf = ByteBuffer.wrap(bytes).order(ByteOrder.LITTLE_ENDIAN);
+
+ // a valid sketch should not throw when compacted, since compacting reads the backing memory
+ objectStrategy.fromByteBufferSafe(buf, bytes.length).getSketch().compact().getCompactBytes();
+
+ // a corrupted sketch should fail with a regular Java buffer exception
+ for (int subset = 3; subset < bytes.length - 1; subset++) {
+ final byte[] garbage2 = new byte[subset];
+ for (int i = 0; i < garbage2.length; i++) {
+ garbage2[i] = buf.get(i);
+ }
+
+ final ByteBuffer buf2 = ByteBuffer.wrap(garbage2).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf2, garbage2.length).getSketch().compact().getCompactBytes()
+ );
+ }
+
+ // a non-sketch too short to contain a header should fail with a regular Java buffer exception
+ final byte[] garbage = new byte[]{0x01, 0x02};
+ final ByteBuffer buf3 = ByteBuffer.wrap(garbage).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf3, garbage.length).getSketch().compact().getCompactBytes()
+ );
+
+ // a non-sketch long enough to be checked fails the sketch library's own validation (this one doesn't actually need the 'safe' read)
+ final byte[] garbageLonger = StringUtils.toUtf8("notasketch");
+ final ByteBuffer buf4 = ByteBuffer.wrap(garbageLonger).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ SketchesArgumentException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf4, garbageLonger.length).getSketch().compact().getCompactBytes()
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderTest.java
new file mode 100644
index 000000000000..ef68fdeb8c58
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/SketchHolderTest.java
@@ -0,0 +1,52 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.theta;
+
+import org.apache.datasketches.Family;
+import org.apache.datasketches.theta.SetOperation;
+import org.apache.datasketches.theta.Union;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.util.Arrays;
+
+public class SketchHolderTest
+{
+ @Test
+ public void testDeserializeSafe()
+ {
+ Union union = (Union) SetOperation.builder().setNominalEntries(1024).build(Family.UNION);
+ union.update(1234L);
+ final byte[] bytes = union.getResult().toByteArray();
+ final String base64 = StringUtils.encodeBase64String(bytes);
+
+ Assert.assertArrayEquals(bytes, SketchHolder.deserializeSafe(union.getResult()).getSketch().toByteArray());
+ Assert.assertArrayEquals(bytes, SketchHolder.deserializeSafe(bytes).getSketch().toByteArray());
+ Assert.assertArrayEquals(bytes, SketchHolder.deserializeSafe(base64).getSketch().toByteArray());
+
+ final byte[] truncated = Arrays.copyOfRange(bytes, 0, 10);
+ Assert.assertThrows(IndexOutOfBoundsException.class, () -> SketchHolder.deserializeSafe(truncated));
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> SketchHolder.deserializeSafe(StringUtils.encodeBase64String(truncated))
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSqlAggregatorTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSqlAggregatorTest.java
index 128ffd9419e3..f5a23178dd02 100644
--- a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSqlAggregatorTest.java
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/theta/sql/ThetaSketchSqlAggregatorTest.java
@@ -19,17 +19,14 @@
package org.apache.druid.query.aggregation.datasketches.theta.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
-import org.apache.druid.guice.ExpressionModule;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.StringUtils;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.java.util.common.granularity.PeriodGranularity;
-import org.apache.druid.math.expr.ExprMacroTable;
import org.apache.druid.query.Druids;
import org.apache.druid.query.QueryDataSource;
import org.apache.druid.query.QueryRunnerFactoryConglomerate;
@@ -57,58 +54,48 @@
import org.apache.druid.segment.virtual.ExpressionVirtualColumn;
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
-import org.apache.druid.sql.calcite.aggregation.ApproxCountDistinctSqlAggregator;
-import org.apache.druid.sql.calcite.aggregation.builtin.CountSqlAggregator;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
+import org.apache.druid.sql.guice.SqlModule;
import org.apache.druid.timeline.DataSegment;
import org.apache.druid.timeline.partition.LinearShardSpec;
import org.joda.time.DateTimeZone;
import org.joda.time.Period;
-import org.junit.Before;
import org.junit.Test;
import java.io.IOException;
-import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;
+import java.util.Properties;
public class ThetaSketchSqlAggregatorTest extends BaseCalciteQueryTest
{
private static final String DATA_SOURCE = "foo";
- private ExprMacroTable macroTable;
-
- @Before
- public void setUp()
- {
- macroTable = createMacroTable();
- }
-
@Override
- public Iterable<? extends Module> getJacksonModules()
+ public void gatherProperties(Properties properties)
{
- return Iterables.concat(super.getJacksonModules(), new SketchModule().getJacksonModules());
+ super.gatherProperties(properties);
+
+ // Use APPROX_COUNT_DISTINCT_DS_THETA as APPROX_COUNT_DISTINCT impl for these tests.
+ properties.put(SqlModule.PROPERTY_SQL_APPROX_COUNT_DISTINCT_CHOICE, ThetaSketchApproxCountDistinctSqlAggregator.NAME);
}
@Override
- public ExprMacroTable createMacroTable()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- final List<ExprMacroTable.ExprMacro> exprMacros = new ArrayList<>();
- for (Class<? extends ExprMacroTable.ExprMacro> clazz : ExpressionModule.EXPR_MACROS) {
- exprMacros.add(CalciteTests.INJECTOR.getInstance(clazz));
- }
- return new ExprMacroTable(exprMacros);
+ super.configureGuice(builder);
+ builder.addModule(new SketchModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
SketchModule.registerSerde();
@@ -148,31 +135,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- final ThetaSketchApproxCountDistinctSqlAggregator approxCountDistinctSqlAggregator =
- new ThetaSketchApproxCountDistinctSqlAggregator();
-
- return new DruidOperatorTable(
- ImmutableSet.of(
- new ThetaSketchApproxCountDistinctSqlAggregator(),
- new ThetaSketchObjectSqlAggregator(),
-
- // Use APPROX_COUNT_DISTINCT_DS_THETA as APPROX_COUNT_DISTINCT impl for these tests.
- new CountSqlAggregator(new ApproxCountDistinctSqlAggregator(approxCountDistinctSqlAggregator)),
- new ApproxCountDistinctSqlAggregator(approxCountDistinctSqlAggregator)
- ),
- ImmutableSet.of(
- new ThetaSketchEstimateOperatorConversion(),
- new ThetaSketchEstimateWithErrorBoundsOperatorConversion(),
- new ThetaSketchSetIntersectOperatorConversion(),
- new ThetaSketchSetUnionOperatorConversion(),
- new ThetaSketchSetNotOperatorConversion()
- )
- );
- }
-
@Test
public void testApproxCountDistinctThetaSketch()
{
@@ -235,13 +197,13 @@ public void testApproxCountDistinctThetaSketch()
"v0",
"substring(\"dim2\", 0, 1)",
ColumnType.STRING,
- macroTable
+ queryFramework().macroTable()
),
new ExpressionVirtualColumn(
"v1",
"concat(substring(\"dim2\", 0, 1),'x')",
ColumnType.STRING,
- macroTable
+ queryFramework().macroTable()
)
)
.aggregators(
@@ -444,7 +406,7 @@ public void testThetaSketchPostAggs()
"v0",
"concat(\"dim2\",'hello')",
ColumnType.STRING,
- macroTable
+ queryFramework().macroTable()
)
)
.aggregators(
@@ -621,7 +583,7 @@ public void testThetaSketchPostAggsFinalizeOuterSketches()
"v0",
"concat(\"dim2\",'hello')",
ColumnType.STRING,
- macroTable
+ queryFramework().macroTable()
)
)
.aggregators(
@@ -1052,4 +1014,12 @@ public void testGroupByAggregatorDefaultValuesFinalizeOuterSketches()
ImmutableList.of(new Object[]{"a", 0L, 0L, "0.0", "0.0"})
);
}
+
+ @Test
+ public void testThetaSketchIntersectOnScalarExpression()
+ {
+ assertQueryIsUnplannable("SELECT THETA_SKETCH_INTERSECT(NULL, NULL) FROM foo",
+ "Possible error: THETA_SKETCH_INTERSECT can only be used on aggregates. " +
+ "It cannot be used directly on a column or on a scalar expression.");
+ }
}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategyTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategyTest.java
new file mode 100644
index 000000000000..ee59ddf57645
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchObjectStrategyTest.java
@@ -0,0 +1,70 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.tuple;
+
+import org.apache.datasketches.tuple.arrayofdoubles.ArrayOfDoublesUpdatableSketch;
+import org.apache.datasketches.tuple.arrayofdoubles.ArrayOfDoublesUpdatableSketchBuilder;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.nio.ByteBuffer;
+import java.nio.ByteOrder;
+
+public class ArrayOfDoublesSketchObjectStrategyTest
+{
+ @Test
+ public void testSafeRead()
+ {
+ ArrayOfDoublesSketchObjectStrategy objectStrategy = new ArrayOfDoublesSketchObjectStrategy();
+ ArrayOfDoublesUpdatableSketch sketch = new ArrayOfDoublesUpdatableSketchBuilder().setNominalEntries(1024)
+ .setNumberOfValues(4)
+ .build();
+ sketch.update(1L, new double[]{1.0, 2.0, 3.0, 4.0});
+
+ final byte[] bytes = sketch.compact().toByteArray();
+
+ ByteBuffer buf = ByteBuffer.wrap(bytes).order(ByteOrder.LITTLE_ENDIAN);
+
+ // a valid sketch should not throw when compacted and serialized, since that reads the backing memory
+ objectStrategy.fromByteBufferSafe(buf, bytes.length).compact().toByteArray();
+
+ // a corrupted sketch should fail with a regular Java buffer exception
+ for (int subset = 3; subset < bytes.length - 1; subset++) {
+ final byte[] garbage2 = new byte[subset];
+ for (int i = 0; i < garbage2.length; i++) {
+ garbage2[i] = buf.get(i);
+ }
+
+ final ByteBuffer buf2 = ByteBuffer.wrap(garbage2).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf2, garbage2.length).compact().toByteArray()
+ );
+ }
+
+ // a non-sketch too short to contain a header should fail with a regular Java buffer exception
+ final byte[] garbage = new byte[]{0x01, 0x02};
+ final ByteBuffer buf3 = ByteBuffer.wrap(garbage).order(ByteOrder.LITTLE_ENDIAN);
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> objectStrategy.fromByteBufferSafe(buf3, garbage.length).compact().toByteArray()
+ );
+ }
+}
diff --git a/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperationsTest.java b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperationsTest.java
new file mode 100644
index 000000000000..415f3acab970
--- /dev/null
+++ b/extensions-core/datasketches/src/test/java/org/apache/druid/query/aggregation/datasketches/tuple/ArrayOfDoublesSketchOperationsTest.java
@@ -0,0 +1,55 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.query.aggregation.datasketches.tuple;
+
+import org.apache.datasketches.tuple.arrayofdoubles.ArrayOfDoublesUpdatableSketch;
+import org.apache.datasketches.tuple.arrayofdoubles.ArrayOfDoublesUpdatableSketchBuilder;
+import org.apache.druid.java.util.common.StringUtils;
+import org.junit.Assert;
+import org.junit.Test;
+
+import java.util.Arrays;
+
+public class ArrayOfDoublesSketchOperationsTest
+{
+ @Test
+ public void testDeserializeSafe()
+ {
+ ArrayOfDoublesUpdatableSketch sketch = new ArrayOfDoublesUpdatableSketchBuilder().setNominalEntries(1024)
+ .setNumberOfValues(4)
+ .build();
+ sketch.update(1L, new double[]{1.0, 2.0, 3.0, 4.0});
+
+ final byte[] bytes = sketch.toByteArray();
+ final String base64 = StringUtils.encodeBase64String(bytes);
+
+ Assert.assertArrayEquals(bytes, ArrayOfDoublesSketchOperations.deserializeSafe(sketch).toByteArray());
+ Assert.assertArrayEquals(bytes, ArrayOfDoublesSketchOperations.deserializeSafe(bytes).toByteArray());
+ Assert.assertArrayEquals(bytes, ArrayOfDoublesSketchOperations.deserializeSafe(base64).toByteArray());
+
+ final byte[] truncated = Arrays.copyOfRange(bytes, 0, 10);
+ Assert.assertThrows(IndexOutOfBoundsException.class, () -> ArrayOfDoublesSketchOperations.deserializeSafe(truncated));
+ Assert.assertThrows(
+ IndexOutOfBoundsException.class,
+ () -> ArrayOfDoublesSketchOperations.deserializeSafe(StringUtils.encodeBase64String(truncated))
+ );
+ }
+}
diff --git a/extensions-core/druid-aws-rds-extensions/pom.xml b/extensions-core/druid-aws-rds-extensions/pom.xml
index b18e1aea7214..f242e1e485c5 100644
--- a/extensions-core/druid-aws-rds-extensions/pom.xml
+++ b/extensions-core/druid-aws-rds-extensions/pom.xml
@@ -30,7 +30,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/druid-basic-security/pom.xml b/extensions-core/druid-basic-security/pom.xml
index c8a3ab20e8ee..4bce2588c574 100644
--- a/extensions-core/druid-basic-security/pom.xml
+++ b/extensions-core/druid-basic-security/pom.xml
@@ -30,7 +30,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/druid-bloom-filter/pom.xml b/extensions-core/druid-bloom-filter/pom.xml
index 0bc86e8e271e..4a457f92a129 100644
--- a/extensions-core/druid-bloom-filter/pom.xml
+++ b/extensions-core/druid-bloom-filter/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/aggregation/bloom/sql/BloomFilterSqlAggregatorTest.java b/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/aggregation/bloom/sql/BloomFilterSqlAggregatorTest.java
index 26f1ce108fee..c1426048faf3 100644
--- a/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/aggregation/bloom/sql/BloomFilterSqlAggregatorTest.java
+++ b/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/aggregation/bloom/sql/BloomFilterSqlAggregatorTest.java
@@ -19,10 +19,9 @@
package org.apache.druid.query.aggregation.bloom.sql;
-import com.fasterxml.jackson.databind.Module;
+import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.common.collect.ImmutableList;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
import org.apache.druid.data.input.InputRow;
import org.apache.druid.data.input.impl.DimensionSchema;
@@ -35,6 +34,7 @@
import org.apache.druid.data.input.impl.TimeAndDimsParseSpec;
import org.apache.druid.data.input.impl.TimestampSpec;
import org.apache.druid.guice.BloomFilterExtensionModule;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.query.Druids;
import org.apache.druid.query.QueryRunnerFactoryConglomerate;
@@ -59,7 +59,6 @@
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
@@ -76,21 +75,18 @@ public class BloomFilterSqlAggregatorTest extends BaseCalciteQueryTest
private static final String DATA_SOURCE = "numfoo";
- private static final DruidOperatorTable OPERATOR_TABLE = new DruidOperatorTable(
- ImmutableSet.of(new BloomFilterSqlAggregator()),
- ImmutableSet.of()
- );
-
@Override
- public Iterable extends Module> getJacksonModules()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- return Iterables.concat(super.getJacksonModules(), new BloomFilterExtensionModule().getJacksonModules());
+ super.configureGuice(builder);
+ builder.addModule(new BloomFilterExtensionModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
InputRowParser parser = new MapInputRowParser(
@@ -135,12 +131,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return OPERATOR_TABLE;
- }
-
@Test
public void testBloomFilterAgg() throws Exception
{
@@ -178,7 +168,7 @@ public void testBloomFilterAgg() throws Exception
.build()
),
ImmutableList.of(
- new Object[]{CalciteTests.getJsonMapper().writeValueAsString(expected1)}
+ new Object[]{queryFramework().queryJsonMapper().writeValueAsString(expected1)}
)
);
}
@@ -211,6 +201,7 @@ public void testBloomFilterTwoAggs() throws Exception
}
}
+ ObjectMapper jsonMapper = queryFramework().queryJsonMapper();
testQuery(
"SELECT\n"
+ "BLOOM_FILTER(dim1, 1000),\n"
@@ -239,8 +230,8 @@ public void testBloomFilterTwoAggs() throws Exception
),
ImmutableList.of(
new Object[] {
- CalciteTests.getJsonMapper().writeValueAsString(expected1),
- CalciteTests.getJsonMapper().writeValueAsString(expected2)
+ jsonMapper.writeValueAsString(expected1),
+ jsonMapper.writeValueAsString(expected2)
}
)
);
@@ -288,10 +279,9 @@ public void testBloomFilterAggExtractionFn() throws Exception
.build()
),
ImmutableList.of(
- new Object[]{CalciteTests.getJsonMapper().writeValueAsString(expected1)}
+ new Object[]{queryFramework().queryJsonMapper().writeValueAsString(expected1)}
)
);
-
}
@Test
@@ -335,7 +325,7 @@ public void testBloomFilterAggLong() throws Exception
.build()
),
ImmutableList.of(
- new Object[]{CalciteTests.getJsonMapper().writeValueAsString(expected3)}
+ new Object[]{queryFramework().queryJsonMapper().writeValueAsString(expected3)}
)
);
}
@@ -388,7 +378,7 @@ public void testBloomFilterAggLongVirtualColumn() throws Exception
.build()
),
ImmutableList.of(
- new Object[]{CalciteTests.getJsonMapper().writeValueAsString(expected1)}
+ new Object[]{queryFramework().queryJsonMapper().writeValueAsString(expected1)}
)
);
}
@@ -442,7 +432,7 @@ public void testBloomFilterAggFloatVirtualColumn() throws Exception
.build()
),
ImmutableList.of(
- new Object[]{CalciteTests.getJsonMapper().writeValueAsString(expected1)}
+ new Object[]{queryFramework().queryJsonMapper().writeValueAsString(expected1)}
)
);
}
@@ -496,7 +486,7 @@ public void testBloomFilterAggDoubleVirtualColumn() throws Exception
.build()
),
ImmutableList.of(
- new Object[]{CalciteTests.getJsonMapper().writeValueAsString(expected1)}
+ new Object[]{queryFramework().queryJsonMapper().writeValueAsString(expected1)}
)
);
}
@@ -510,6 +500,7 @@ public void testEmptyTimeseriesResults() throws Exception
BloomKFilter expected1 = new BloomKFilter(TEST_NUM_ENTRIES);
BloomKFilter expected2 = new BloomKFilter(TEST_NUM_ENTRIES);
+ ObjectMapper jsonMapper = queryFramework().queryJsonMapper();
testQuery(
"SELECT\n"
+ "BLOOM_FILTER(dim1, 1000),\n"
@@ -540,8 +531,8 @@ public void testEmptyTimeseriesResults() throws Exception
),
ImmutableList.of(
new Object[] {
- CalciteTests.getJsonMapper().writeValueAsString(expected1),
- CalciteTests.getJsonMapper().writeValueAsString(expected2)
+ jsonMapper.writeValueAsString(expected1),
+ jsonMapper.writeValueAsString(expected2)
}
)
);
@@ -556,6 +547,7 @@ public void testGroupByAggregatorDefaultValues() throws Exception
BloomKFilter expected1 = new BloomKFilter(TEST_NUM_ENTRIES);
BloomKFilter expected2 = new BloomKFilter(TEST_NUM_ENTRIES);
+ ObjectMapper jsonMapper = queryFramework().queryJsonMapper();
testQuery(
"SELECT\n"
+ "dim2,\n"
@@ -596,8 +588,8 @@ public void testGroupByAggregatorDefaultValues() throws Exception
ImmutableList.of(
new Object[] {
"a",
- CalciteTests.getJsonMapper().writeValueAsString(expected1),
- CalciteTests.getJsonMapper().writeValueAsString(expected2)
+ jsonMapper.writeValueAsString(expected1),
+ jsonMapper.writeValueAsString(expected2)
}
)
);
diff --git a/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/filter/sql/BloomDimFilterSqlTest.java b/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/filter/sql/BloomDimFilterSqlTest.java
index 4e1659c228fb..c5d6e631c410 100644
--- a/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/filter/sql/BloomDimFilterSqlTest.java
+++ b/extensions-core/druid-bloom-filter/src/test/java/org/apache/druid/query/filter/sql/BloomDimFilterSqlTest.java
@@ -19,22 +19,16 @@
package org.apache.druid.query.filter.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
import org.apache.calcite.avatica.SqlType;
import org.apache.druid.common.config.NullHandling;
import org.apache.druid.guice.BloomFilterExtensionModule;
import org.apache.druid.guice.BloomFilterSerializersModule;
-import org.apache.druid.guice.ExpressionModule;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.StringUtils;
import org.apache.druid.java.util.common.granularity.Granularities;
-import org.apache.druid.math.expr.ExprMacroTable;
import org.apache.druid.query.Druids;
import org.apache.druid.query.aggregation.CountAggregatorFactory;
-import org.apache.druid.query.expression.LookupExprMacro;
-import org.apache.druid.query.expressions.BloomFilterExpressions;
import org.apache.druid.query.filter.BloomDimFilter;
import org.apache.druid.query.filter.BloomKFilter;
import org.apache.druid.query.filter.BloomKFilterHolder;
@@ -42,50 +36,21 @@
import org.apache.druid.query.filter.OrDimFilter;
import org.apache.druid.segment.column.ColumnType;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
-import org.apache.druid.sql.calcite.aggregation.ApproxCountDistinctSqlAggregator;
-import org.apache.druid.sql.calcite.aggregation.builtin.BuiltinApproxCountDistinctSqlAggregator;
-import org.apache.druid.sql.calcite.aggregation.builtin.CountSqlAggregator;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.http.SqlParameter;
import org.junit.Ignore;
import org.junit.Test;
import java.io.IOException;
-import java.util.ArrayList;
-import java.util.List;
public class BloomDimFilterSqlTest extends BaseCalciteQueryTest
{
@Override
- public DruidOperatorTable createOperatorTable()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- CalciteTests.getJsonMapper().registerModule(new BloomFilterSerializersModule());
- return new DruidOperatorTable(
- ImmutableSet.of(
- new CountSqlAggregator(new ApproxCountDistinctSqlAggregator(new BuiltinApproxCountDistinctSqlAggregator()))
- ),
- ImmutableSet.of(new BloomFilterOperatorConversion())
- );
- }
-
- @Override
- public ExprMacroTable createMacroTable()
- {
- final List exprMacros = new ArrayList<>();
- for (Class extends ExprMacroTable.ExprMacro> clazz : ExpressionModule.EXPR_MACROS) {
- exprMacros.add(CalciteTests.INJECTOR.getInstance(clazz));
- }
- exprMacros.add(CalciteTests.INJECTOR.getInstance(LookupExprMacro.class));
- exprMacros.add(new BloomFilterExpressions.TestExprMacro());
- return new ExprMacroTable(exprMacros);
- }
-
- @Override
- public Iterable extends Module> getJacksonModules()
- {
- return Iterables.concat(super.getJacksonModules(), new BloomFilterExtensionModule().getJacksonModules());
+ super.configureGuice(builder);
+ builder.addModule(new BloomFilterExtensionModule());
}
@Test
@@ -144,7 +109,7 @@ public void testBloomFilterExprFilter() throws IOException
base64
),
null,
- createMacroTable()
+ queryFramework().macroTable()
)
)
.aggregators(aggregators(new CountAggregatorFactory("a0")))
diff --git a/extensions-core/druid-catalog/pom.xml b/extensions-core/druid-catalog/pom.xml
index 0678f95ff047..6a40adb17bc8 100644
--- a/extensions-core/druid-catalog/pom.xml
+++ b/extensions-core/druid-catalog/pom.xml
@@ -31,7 +31,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/druid-kerberos/pom.xml b/extensions-core/druid-kerberos/pom.xml
index a2d248348222..9a36a98ba6eb 100644
--- a/extensions-core/druid-kerberos/pom.xml
+++ b/extensions-core/druid-kerberos/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/druid-pac4j/pom.xml b/extensions-core/druid-pac4j/pom.xml
index e3e675800438..5e4807def663 100644
--- a/extensions-core/druid-pac4j/pom.xml
+++ b/extensions-core/druid-pac4j/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/druid-ranger-security/pom.xml b/extensions-core/druid-ranger-security/pom.xml
index 39d42ccb2685..edb31fe29336 100644
--- a/extensions-core/druid-ranger-security/pom.xml
+++ b/extensions-core/druid-ranger-security/pom.xml
@@ -30,7 +30,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/ec2-extensions/pom.xml b/extensions-core/ec2-extensions/pom.xml
index 57f41e3ce8f6..85e95f53a624 100644
--- a/extensions-core/ec2-extensions/pom.xml
+++ b/extensions-core/ec2-extensions/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/google-extensions/pom.xml b/extensions-core/google-extensions/pom.xml
index c29738a0cba3..ea6ab401f34c 100644
--- a/extensions-core/google-extensions/pom.xml
+++ b/extensions-core/google-extensions/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/hdfs-storage/pom.xml b/extensions-core/hdfs-storage/pom.xml
index 83a6fd8b1849..587474b5475f 100644
--- a/extensions-core/hdfs-storage/pom.xml
+++ b/extensions-core/hdfs-storage/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/histogram/pom.xml b/extensions-core/histogram/pom.xml
index 9dd821478071..67fdf2003d45 100644
--- a/extensions-core/histogram/pom.xml
+++ b/extensions-core/histogram/pom.xml
@@ -28,7 +28,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/FixedBucketsHistogramQuantileSqlAggregatorTest.java b/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/FixedBucketsHistogramQuantileSqlAggregatorTest.java
index dd6399038c3e..a4eae57756ce 100644
--- a/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/FixedBucketsHistogramQuantileSqlAggregatorTest.java
+++ b/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/FixedBucketsHistogramQuantileSqlAggregatorTest.java
@@ -19,12 +19,11 @@
package org.apache.druid.query.aggregation.histogram.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.query.Druids;
import org.apache.druid.query.QueryContexts;
@@ -55,7 +54,6 @@
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
@@ -68,21 +66,18 @@
public class FixedBucketsHistogramQuantileSqlAggregatorTest extends BaseCalciteQueryTest
{
- private static final DruidOperatorTable OPERATOR_TABLE = new DruidOperatorTable(
- ImmutableSet.of(new QuantileSqlAggregator(), new FixedBucketsHistogramQuantileSqlAggregator()),
- ImmutableSet.of()
- );
-
@Override
- public Iterable extends Module> getJacksonModules()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- return Iterables.concat(super.getJacksonModules(), new ApproximateHistogramDruidModule().getJacksonModules());
+ super.configureGuice(builder);
+ builder.addModule(new ApproximateHistogramDruidModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
ApproximateHistogramDruidModule.registerSerde();
@@ -123,13 +118,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return OPERATOR_TABLE;
- }
-
-
@Test
public void testQuantileOnFloatAndLongs()
{
@@ -568,7 +556,6 @@ public void testEmptyTimeseriesResults()
);
}
-
@Test
public void testGroupByAggregatorDefaultValues()
{
diff --git a/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/QuantileSqlAggregatorTest.java b/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/QuantileSqlAggregatorTest.java
index 6ed4c7e45106..4a67833b5249 100644
--- a/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/QuantileSqlAggregatorTest.java
+++ b/extensions-core/histogram/src/test/java/org/apache/druid/query/aggregation/histogram/sql/QuantileSqlAggregatorTest.java
@@ -19,11 +19,10 @@
package org.apache.druid.query.aggregation.histogram.sql;
-import com.fasterxml.jackson.databind.Module;
import com.google.common.collect.ImmutableList;
-import com.google.common.collect.ImmutableSet;
-import com.google.common.collect.Iterables;
+import com.google.inject.Injector;
import org.apache.druid.common.config.NullHandling;
+import org.apache.druid.guice.DruidInjectorBuilder;
import org.apache.druid.java.util.common.granularity.Granularities;
import org.apache.druid.math.expr.ExprMacroTable;
import org.apache.druid.query.Druids;
@@ -54,7 +53,6 @@
import org.apache.druid.segment.writeout.OffHeapMemorySegmentWriteOutMediumFactory;
import org.apache.druid.sql.calcite.BaseCalciteQueryTest;
import org.apache.druid.sql.calcite.filtration.Filtration;
-import org.apache.druid.sql.calcite.planner.DruidOperatorTable;
import org.apache.druid.sql.calcite.util.CalciteTests;
import org.apache.druid.sql.calcite.util.SpecificSegmentsQuerySegmentWalker;
import org.apache.druid.sql.calcite.util.TestDataBuilder;
@@ -67,21 +65,18 @@
public class QuantileSqlAggregatorTest extends BaseCalciteQueryTest
{
- private static final DruidOperatorTable OPERATOR_TABLE = new DruidOperatorTable(
- ImmutableSet.of(new QuantileSqlAggregator()),
- ImmutableSet.of()
- );
-
@Override
- public Iterable extends Module> getJacksonModules()
+ public void configureGuice(DruidInjectorBuilder builder)
{
- return Iterables.concat(super.getJacksonModules(), new ApproximateHistogramDruidModule().getJacksonModules());
+ super.configureGuice(builder);
+ builder.addModule(new ApproximateHistogramDruidModule());
}
@Override
public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
final QueryRunnerFactoryConglomerate conglomerate,
- final JoinableFactoryWrapper joinableFactory
+ final JoinableFactoryWrapper joinableFactory,
+ final Injector injector
) throws IOException
{
ApproximateHistogramDruidModule.registerSerde();
@@ -122,12 +117,6 @@ public SpecificSegmentsQuerySegmentWalker createQuerySegmentWalker(
);
}
- @Override
- public DruidOperatorTable createOperatorTable()
- {
- return OPERATOR_TABLE;
- }
-
@Test
public void testQuantileOnFloatAndLongs()
{
diff --git a/extensions-core/kafka-extraction-namespace/pom.xml b/extensions-core/kafka-extraction-namespace/pom.xml
index 29f39f4dc2e8..1fa023dd3e64 100644
--- a/extensions-core/kafka-extraction-namespace/pom.xml
+++ b/extensions-core/kafka-extraction-namespace/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/kafka-indexing-service/pom.xml b/extensions-core/kafka-indexing-service/pom.xml
index 61102acc2bee..05a5bd840595 100644
--- a/extensions-core/kafka-indexing-service/pom.xml
+++ b/extensions-core/kafka-indexing-service/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/kafka-indexing-service/src/main/java/org/apache/druid/data/input/kafkainput/KafkaInputReader.java b/extensions-core/kafka-indexing-service/src/main/java/org/apache/druid/data/input/kafkainput/KafkaInputReader.java
index 458955e58070..56e94215940b 100644
--- a/extensions-core/kafka-indexing-service/src/main/java/org/apache/druid/data/input/kafkainput/KafkaInputReader.java
+++ b/extensions-core/kafka-indexing-service/src/main/java/org/apache/druid/data/input/kafkainput/KafkaInputReader.java
@@ -30,24 +30,24 @@
import org.apache.druid.indexing.seekablestream.SettableByteEntity;
import org.apache.druid.java.util.common.CloseableIterators;
import org.apache.druid.java.util.common.Pair;
-import org.apache.druid.java.util.common.logger.Logger;
import org.apache.druid.java.util.common.parsers.CloseableIterator;
import org.apache.druid.java.util.common.parsers.ParseException;
import javax.annotation.Nullable;
-
import java.io.IOException;
+import java.util.AbstractMap;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
+import java.util.LinkedHashSet;
import java.util.List;
import java.util.Map;
+import java.util.Set;
import java.util.function.Function;
+import java.util.stream.Collectors;
public class KafkaInputReader implements InputEntityReader
{
- private static final Logger log = new Logger(KafkaInputReader.class);
-
private final InputRowSchema inputRowSchema;
private final SettableByteEntity source;
private final Function headerParserSupplier;
@@ -85,7 +85,60 @@ public KafkaInputReader(
this.timestampColumnName = timestampColumnName;
}
- private List getFinalDimensionList(HashSet newDimensions)
+ @Override
+ public CloseableIterator read() throws IOException
+ {
+ final KafkaRecordEntity record = source.getEntity();
+ final Map mergedHeaderMap = new HashMap<>();
+ if (headerParserSupplier != null) {
+ KafkaHeaderReader headerParser = headerParserSupplier.apply(record);
+ List> headerList = headerParser.read();
+ for (Pair ele : headerList) {
+ mergedHeaderMap.put(ele.lhs, ele.rhs);
+ }
+ }
+
+ // Add the Kafka record timestamp to the merged map; the record timestamp is skipped if the same key
+ // already exists in the header list.
+ mergedHeaderMap.putIfAbsent(timestampColumnName, record.getRecord().timestamp());
+
+ InputEntityReader keyParser = (keyParserSupplier == null) ? null : keyParserSupplier.apply(record);
+ if (keyParser != null) {
+ try (CloseableIterator keyIterator = keyParser.read()) {
+ // Key currently only takes the first row and ignores the rest.
+ if (keyIterator.hasNext()) {
+ // Return type for the key parser should be of type MapBasedInputRow
+ // Parsers returning other types are not compatible currently.
+ MapBasedInputRow keyRow = (MapBasedInputRow) keyIterator.next();
+ // Add the key to the merged map only if the key is not already present.
+ mergedHeaderMap.putIfAbsent(
+ keyColumnName,
+ keyRow.getEvent().entrySet().stream().findFirst().get().getValue()
+ );
+ }
+ }
+ catch (ClassCastException e) {
+ throw new IOException(
+ "Unsupported keyFormat. KafkaInputFormat only supports input formats that return MapBasedInputRow rows"
+ );
+ }
+ }
+
+ // Ignore tombstone records that have null values.
+ if (record.getRecord().value() != null) {
+ return buildBlendedRows(valueParser, mergedHeaderMap);
+ } else {
+ return buildRowsWithoutValuePayload(mergedHeaderMap);
+ }
+ }
+
+ @Override
+ public CloseableIterator sample() throws IOException
+ {
+ return read().map(row -> InputRowListPlusRawValues.of(row, ((MapBasedInputRow) row).getEvent()));
+ }
+
+ private List getFinalDimensionList(Set newDimensions)
{
final List schemaDimensions = inputRowSchema.getDimensionsSpec().getDimensionNames();
if (!schemaDimensions.isEmpty()) {
@@ -97,11 +150,14 @@ private List getFinalDimensionList(HashSet newDimensions)
}
}
- private CloseableIterator buildBlendedRows(InputEntityReader valueParser, Map headerKeyList) throws IOException
+ private CloseableIterator buildBlendedRows(
+ InputEntityReader valueParser,
+ Map headerKeyList
+ ) throws IOException
{
return valueParser.read().map(
r -> {
- MapBasedInputRow valueRow;
+ final MapBasedInputRow valueRow;
try {
// Return type for the value parser should be of type MapBasedInputRow
// Parsers returning other types are not compatible currently.
@@ -113,14 +169,9 @@ private CloseableIterator buildBlendedRows(InputEntityReader valuePars
"Unsupported input format in valueFormat. KafkaInputFormat only supports input format that return MapBasedInputRow rows"
);
}
- Map event = new HashMap<>(headerKeyList);
- /* Currently we prefer payload attributes if there is a collision in names.
- We can change this beahvior in later changes with a config knob. This default
- behavior lets easy porting of existing inputFormats to the new one without any changes.
- */
- event.putAll(valueRow.getEvent());
-
- HashSet newDimensions = new HashSet(valueRow.getDimensions());
+
+ final Map event = buildBlendedEventMap(valueRow.getEvent(), headerKeyList);
+ final HashSet newDimensions = new HashSet<>(valueRow.getDimensions());
newDimensions.addAll(headerKeyList.keySet());
// Remove the dummy timestamp added in KafkaInputFormat
newDimensions.remove(KafkaInputFormat.DEFAULT_AUTO_TIMESTAMP_STRING);
@@ -136,60 +187,70 @@ private CloseableIterator buildBlendedRows(InputEntityReader valuePars
private CloseableIterator buildRowsWithoutValuePayload(Map headerKeyList)
{
- HashSet newDimensions = new HashSet(headerKeyList.keySet());
- InputRow row = new MapBasedInputRow(
+ final InputRow row = new MapBasedInputRow(
inputRowSchema.getTimestampSpec().extractTimestamp(headerKeyList),
- getFinalDimensionList(newDimensions),
+ getFinalDimensionList(headerKeyList.keySet()),
headerKeyList
);
- List rows = Collections.singletonList(row);
+ final List rows = Collections.singletonList(row);
return CloseableIterators.withEmptyBaggage(rows.iterator());
}
- @Override
- public CloseableIterator read() throws IOException
+ /**
+ * Builds a map that blends two {@link Map}s, presenting the combined keyset of both maps, preferring to read
+ * from the first map and falling back to the second map if the value is not present.
+ *
+ * This strategy is used rather than just copying the values of the keyset into a new map so that any 'flattening'
+ * machinery (such as a {@link Map} created by {@link org.apache.druid.java.util.common.parsers.ObjectFlatteners})
+ * remains in place to be lazily evaluated instead of eagerly copied.
+ */
+ private static Map buildBlendedEventMap(Map map, Map fallback)
{
- KafkaRecordEntity record = source.getEntity();
- Map mergeMap = new HashMap<>();
- if (headerParserSupplier != null) {
- KafkaHeaderReader headerParser = headerParserSupplier.apply(record);
- List> headerList = headerParser.read();
- for (Pair ele : headerList) {
- mergeMap.put(ele.lhs, ele.rhs);
- }
- }
-
- // Add kafka record timestamp to the mergelist, we will skip record timestamp if the same key exists already in the header list
- mergeMap.putIfAbsent(timestampColumnName, record.getRecord().timestamp());
+ final Set keySet = new HashSet<>(fallback.keySet());
+ keySet.addAll(map.keySet());
- InputEntityReader keyParser = (keyParserSupplier == null) ? null : keyParserSupplier.apply(record);
- if (keyParser != null) {
- try (CloseableIterator keyIterator = keyParser.read()) {
- // Key currently only takes the first row and ignores the rest.
- if (keyIterator.hasNext()) {
- // Return type for the key parser should be of type MapBasedInputRow
- // Parsers returning other types are not compatible currently.
- MapBasedInputRow keyRow = (MapBasedInputRow) keyIterator.next();
- // Add the key to the mergeList only if the key string is not already present
- mergeMap.putIfAbsent(keyColumnName, keyRow.getEvent().entrySet().stream().findFirst().get().getValue());
- }
+ return new AbstractMap()
+ {
+ @Override
+ public Object get(Object key)
+ {
+ return map.getOrDefault((String) key, fallback.get(key));
}
- catch (ClassCastException e) {
- throw new IOException("Unsupported input format in keyFormat. KafkaInputformat only supports input format that return MapBasedInputRow rows");
+
+ @Override
+ public Set keySet()
+ {
+ return keySet;
}
- }
- // Ignore tombstone records that have null values.
- if (record.getRecord().value() != null) {
- return buildBlendedRows(valueParser, mergeMap);
- } else {
- return buildRowsWithoutValuePayload(mergeMap);
- }
- }
+ @Override
+ public Set> entrySet()
+ {
+ return keySet().stream()
+ .map(
+ field -> new Entry()
+ {
+ @Override
+ public String getKey()
+ {
+ return field;
+ }
- @Override
- public CloseableIterator sample() throws IOException
- {
- return read().map(row -> InputRowListPlusRawValues.of(row, ((MapBasedInputRow) row).getEvent()));
+ @Override
+ public Object getValue()
+ {
+ return get(field);
+ }
+
+ @Override
+ public Object setValue(final Object value)
+ {
+ throw new UnsupportedOperationException();
+ }
+ }
+ )
+ .collect(Collectors.toCollection(LinkedHashSet::new));
+ }
+ };
}
}
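
To make the precedence of buildBlendedEventMap concrete, here is a hedged usage sketch (keys and values are illustrative only): reads prefer the value row's event map and fall back to the header map, while the exposed keyset is the union of both.

Map<String, Object> payload = new HashMap<>();
payload.put("foo", "fromPayload");

Map<String, Object> headers = new HashMap<>();
headers.put("foo", "fromHeader");
headers.put("kafka.timestamp", 1624492800000L);

Map<String, Object> blended = buildBlendedEventMap(payload, headers);
// Payload wins on key collisions; header-only keys remain visible:
// blended.get("foo")             -> "fromPayload"
// blended.get("kafka.timestamp") -> 1624492800000L
// blended.keySet()               -> ["foo", "kafka.timestamp"]
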
diff --git a/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/data/input/kafkainput/KafkaInputFormatTest.java b/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/data/input/kafkainput/KafkaInputFormatTest.java
index fe0b89e996f8..a45730005a9c 100644
--- a/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/data/input/kafkainput/KafkaInputFormatTest.java
+++ b/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/data/input/kafkainput/KafkaInputFormatTest.java
@@ -22,12 +22,12 @@
import com.fasterxml.jackson.core.JsonProcessingException;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.common.collect.ImmutableList;
+import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Iterables;
import org.apache.druid.data.input.ColumnsFilter;
import org.apache.druid.data.input.InputEntityReader;
import org.apache.druid.data.input.InputRow;
import org.apache.druid.data.input.InputRowSchema;
-import org.apache.druid.data.input.MapBasedInputRow;
import org.apache.druid.data.input.impl.DimensionsSpec;
import org.apache.druid.data.input.impl.JsonInputFormat;
import org.apache.druid.data.input.impl.TimestampSpec;
@@ -205,6 +205,7 @@ public void testWithHeaderKeyAndValue() throws IOException
Assert.assertEquals("4", Iterables.getOnlyElement(row.getDimension("root_baz")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("path_omg")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("jq_omg")));
+ Assert.assertEquals(ImmutableMap.of("mg", 1L), row.getRaw("o"));
// Header verification
Assert.assertEquals("application/json", Iterables.getOnlyElement(row.getDimension("kafka.newheader.encoding")));
@@ -342,7 +343,6 @@ public byte[] value()
while (iterator.hasNext()) {
final InputRow row = iterator.next();
- final MapBasedInputRow mrow = (MapBasedInputRow) row;
// Payload verifications
Assert.assertEquals(DateTimes.of("2021-06-24"), row.getTimestamp());
Assert.assertEquals("x", Iterables.getOnlyElement(row.getDimension("foo")));
@@ -350,6 +350,7 @@ public byte[] value()
Assert.assertEquals("4", Iterables.getOnlyElement(row.getDimension("root_baz")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("path_omg")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("jq_omg")));
+ Assert.assertEquals(ImmutableMap.of("mg", 1L), row.getRaw("o"));
// Header verification
Assert.assertEquals("application/json", Iterables.getOnlyElement(row.getDimension("kafka.newheader.encoding")));
@@ -444,6 +445,7 @@ public void testWithOutKeyAndHeaderSpecs() throws IOException
Assert.assertEquals("4", Iterables.getOnlyElement(row.getDimension("root_baz")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("path_omg")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("jq_omg")));
+ Assert.assertEquals(ImmutableMap.of("mg", 1L), row.getRaw("o"));
numActualIterations++;
}
@@ -521,6 +523,7 @@ public void testWithMultipleMixedRecords() throws IOException
Assert.assertEquals("4", Iterables.getOnlyElement(row.getDimension("root_baz")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("path_omg")));
Assert.assertEquals("1", Iterables.getOnlyElement(row.getDimension("jq_omg")));
+ Assert.assertEquals(ImmutableMap.of("mg", 1L), row.getRaw("o"));
Assert.assertEquals(String.valueOf(i), Iterables.getOnlyElement(row.getDimension("index")));
diff --git a/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/indexing/kafka/supervisor/KafkaSupervisorTest.java b/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/indexing/kafka/supervisor/KafkaSupervisorTest.java
index ab14f4dac7d6..28b915d22cd4 100644
--- a/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/indexing/kafka/supervisor/KafkaSupervisorTest.java
+++ b/extensions-core/kafka-indexing-service/src/test/java/org/apache/druid/indexing/kafka/supervisor/KafkaSupervisorTest.java
@@ -4150,7 +4150,7 @@ public void testIsTaskCurrent()
@Test
public void testResumeAllActivelyReadingTasks() throws Exception
{
- supervisor = getTestableSupervisor(2, 2, true, "PT1H", null, null);
+ supervisor = getTestableSupervisor(2, 3, true, "PT1H", null, null);
// Mock with task based setup for resumeAsync
EasyMock.reset(taskClient);
addSomeEvents(100);
@@ -4195,7 +4195,27 @@ public void testResumeAllActivelyReadingTasks() throws Exception
supervisor.getTuningConfig()
);
- List tasks = ImmutableList.of(readingTask, publishingTask, pausedTask, failsToResumePausedTask);
+ KafkaIndexTask waitingTask = createKafkaIndexTask("waitingTask",
+ DATASOURCE,
+ 2,
+ new SeekableStreamStartSequenceNumbers<>(topic, ImmutableMap.of(2, 0L), Collections.emptySet()),
+ new SeekableStreamEndSequenceNumbers<>(topic, ImmutableMap.of(2, Long.MAX_VALUE)),
+ null,
+ null,
+ supervisor.getTuningConfig()
+ );
+
+ KafkaIndexTask pendingTask = createKafkaIndexTask("pendingTask",
+ DATASOURCE,
+ 2,
+ new SeekableStreamStartSequenceNumbers<>(topic, ImmutableMap.of(2, 0L), Collections.emptySet()),
+ new SeekableStreamEndSequenceNumbers<>(topic, ImmutableMap.of(2, Long.MAX_VALUE)),
+ null,
+ null,
+ supervisor.getTuningConfig()
+ );
+
+ List tasks = ImmutableList.of(readingTask, publishingTask, pausedTask, failsToResumePausedTask, waitingTask, pendingTask);
Collection taskRunnerWorkItems = ImmutableList.of(
new TestTaskRunnerWorkItem(readingTask, null, new TaskLocation("testHost", 1001, -1)),
new TestTaskRunnerWorkItem(publishingTask, null, new TaskLocation("testHost", 1002, -1)),
@@ -4220,6 +4240,10 @@ public void testResumeAllActivelyReadingTasks() throws Exception
.andReturn(Optional.of(TaskStatus.running(pausedTask.getId()))).anyTimes();
EasyMock.expect(taskStorage.getStatus(failsToResumePausedTask.getId()))
.andReturn(Optional.of(TaskStatus.running(failsToResumePausedTask.getId()))).anyTimes();
+ EasyMock.expect(taskStorage.getStatus(waitingTask.getId()))
+ .andReturn(Optional.of(TaskStatus.running(waitingTask.getId()))).anyTimes();
+ EasyMock.expect(taskStorage.getStatus(pendingTask.getId()))
+ .andReturn(Optional.of(TaskStatus.running(pendingTask.getId()))).anyTimes();
EasyMock.expect(taskStorage.getTask(readingTask.getId()))
.andReturn(Optional.of(readingTask)).anyTimes();
@@ -4229,6 +4253,10 @@ public void testResumeAllActivelyReadingTasks() throws Exception
.andReturn(Optional.of(pausedTask)).anyTimes();
EasyMock.expect(taskStorage.getTask(failsToResumePausedTask.getId()))
.andReturn(Optional.of(failsToResumePausedTask)).anyTimes();
+ EasyMock.expect(taskStorage.getTask(waitingTask.getId()))
+ .andReturn(Optional.of(waitingTask)).anyTimes();
+ EasyMock.expect(taskStorage.getTask(pendingTask.getId()))
+ .andReturn(Optional.of(pendingTask)).anyTimes();
EasyMock.expect(indexerMetadataStorageCoordinator.retrieveDataSourceMetadata(DATASOURCE)).andReturn(
new KafkaDataSourceMetadata(
@@ -4237,6 +4265,12 @@ public void testResumeAllActivelyReadingTasks() throws Exception
).anyTimes();
EasyMock.expect(taskQueue.add(EasyMock.anyObject(Task.class))).andReturn(true);
+
+ EasyMock.expect(taskClient.getStartTimeAsync(waitingTask.getId()))
+ .andReturn(Futures.immediateFuture(null));
+ EasyMock.expect(taskClient.getStartTimeAsync(pendingTask.getId()))
+ .andReturn(Futures.immediateFuture(null));
+
EasyMock.expect(taskClient.getStatusAsync(readingTask.getId()))
.andReturn(Futures.immediateFuture(Status.READING));
EasyMock.expect(taskClient.getStatusAsync(publishingTask.getId()))
@@ -4245,6 +4279,10 @@ public void testResumeAllActivelyReadingTasks() throws Exception
.andReturn(Futures.immediateFuture(Status.PAUSED));
EasyMock.expect(taskClient.getStatusAsync(failsToResumePausedTask.getId()))
.andReturn(Futures.immediateFuture(Status.PAUSED));
+ EasyMock.expect(taskClient.getStatusAsync(waitingTask.getId()))
+ .andReturn(Futures.immediateFuture(Status.NOT_STARTED));
+ EasyMock.expect(taskClient.getStatusAsync(pendingTask.getId()))
+ .andReturn(Futures.immediateFuture(Status.NOT_STARTED));
EasyMock.expect(taskClient.getEndOffsetsAsync(publishingTask.getId()))
.andReturn(Futures.immediateFuture(ImmutableMap.of(0, 0L)));
@@ -4258,6 +4296,12 @@ public void testResumeAllActivelyReadingTasks() throws Exception
EasyMock.expect(taskClient.getCheckpointsAsync(failsToResumePausedTask.getId(), true))
.andReturn(Futures.immediateFuture(new TreeMap<>()));
+ EasyMock.expect(taskClient.getCheckpointsAsync(waitingTask.getId(), true))
+ .andReturn(Futures.immediateFuture(null));
+
+ EasyMock.expect(taskClient.getCheckpointsAsync(pendingTask.getId(), true))
+ .andReturn(Futures.immediateFuture(null));
+
taskRunner.registerListener(EasyMock.anyObject(TaskRunnerListener.class), EasyMock.anyObject(Executor.class));
// Only the active i.e non-publishing tasks are resumed
diff --git a/extensions-core/kinesis-indexing-service/pom.xml b/extensions-core/kinesis-indexing-service/pom.xml
index 166b0291e00c..28533af40191 100644
--- a/extensions-core/kinesis-indexing-service/pom.xml
+++ b/extensions-core/kinesis-indexing-service/pom.xml
@@ -29,7 +29,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/kinesis-indexing-service/src/test/java/org/apache/druid/indexing/kinesis/supervisor/KinesisSupervisorTest.java b/extensions-core/kinesis-indexing-service/src/test/java/org/apache/druid/indexing/kinesis/supervisor/KinesisSupervisorTest.java
index 50fbe2f721db..265a9fc144f8 100644
--- a/extensions-core/kinesis-indexing-service/src/test/java/org/apache/druid/indexing/kinesis/supervisor/KinesisSupervisorTest.java
+++ b/extensions-core/kinesis-indexing-service/src/test/java/org/apache/druid/indexing/kinesis/supervisor/KinesisSupervisorTest.java
@@ -3102,6 +3102,11 @@ public void testNoDataIngestionTasks() throws Exception
EasyMock.expect(taskMaster.getTaskQueue()).andReturn(Optional.of(taskQueue)).anyTimes();
EasyMock.expect(taskMaster.getTaskRunner()).andReturn(Optional.of(taskRunner)).anyTimes();
+ final Collection workItems = new ArrayList();
+ workItems.add(new TestTaskRunnerWorkItem(id1, null, new TaskLocation(id1.getId(), 8100, 8100)));
+ workItems.add(new TestTaskRunnerWorkItem(id2, null, new TaskLocation(id2.getId(), 8100, 8100)));
+ workItems.add(new TestTaskRunnerWorkItem(id3, null, new TaskLocation(id3.getId(), 8100, 8100)));
+ EasyMock.expect(taskRunner.getRunningTasks()).andReturn(workItems);
EasyMock.expect(taskStorage.getActiveTasksByDatasource(DATASOURCE)).andReturn(ImmutableList.of(id1, id2, id3)).anyTimes();
EasyMock.expect(taskStorage.getStatus("id1")).andReturn(Optional.of(TaskStatus.running("id1"))).anyTimes();
EasyMock.expect(taskStorage.getStatus("id2")).andReturn(Optional.of(TaskStatus.running("id2"))).anyTimes();
diff --git a/extensions-core/kubernetes-extensions/pom.xml b/extensions-core/kubernetes-extensions/pom.xml
index 80e110f231a9..aec1de9b8ea1 100644
--- a/extensions-core/kubernetes-extensions/pom.xml
+++ b/extensions-core/kubernetes-extensions/pom.xml
@@ -30,7 +30,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
@@ -90,7 +90,7 @@
org.bouncycastle
bcprov-jdk15on
- 1.68
+ 1.69
runtime
diff --git a/extensions-core/lookups-cached-global/pom.xml b/extensions-core/lookups-cached-global/pom.xml
index b9538f7cacbb..79bff849cbf5 100644
--- a/extensions-core/lookups-cached-global/pom.xml
+++ b/extensions-core/lookups-cached-global/pom.xml
@@ -28,7 +28,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/lookups-cached-single/pom.xml b/extensions-core/lookups-cached-single/pom.xml
index de98aaa38bd1..37fe9bf0e10d 100644
--- a/extensions-core/lookups-cached-single/pom.xml
+++ b/extensions-core/lookups-cached-single/pom.xml
@@ -28,7 +28,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/multi-stage-query/pom.xml b/extensions-core/multi-stage-query/pom.xml
index f8382a967b09..443b792cca65 100644
--- a/extensions-core/multi-stage-query/pom.xml
+++ b/extensions-core/multi-stage-query/pom.xml
@@ -31,7 +31,7 @@
org.apache.druid
druid
- 25.0.0-SNAPSHOT
+ 26.0.0-SNAPSHOT
../../pom.xml
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ClusterStatisticsMergeMode.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ClusterStatisticsMergeMode.java
new file mode 100644
index 000000000000..92ed82ff5e11
--- /dev/null
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ClusterStatisticsMergeMode.java
@@ -0,0 +1,44 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.msq.exec;
+
+/**
+ * Mode which dictates how {@link WorkerSketchFetcher} gets sketches for the partition boundaries from workers.
+ */
+public enum ClusterStatisticsMergeMode
+{
+ /**
+ * Fetches sketches in sequential order based on time. Slower due to overhead, but more accurate.
+ */
+ SEQUENTIAL,
+
+ /**
+ * Fetches all sketches from the workers at once. Faster at generating partitions, but less accurate.
+ */
+ PARALLEL,
+
+ /**
+ * Tries to decide between sequential and parallel modes based on the number of workers and the size of the input.
+ *
+ * If there are more than 100 workers, or if the combined sketch size among all workers exceeds
+ * 1,000,000,000 bytes, SEQUENTIAL mode is chosen; otherwise, PARALLEL mode is chosen.
+ */
+ AUTO
+}
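
For reference, a hedged sketch of the AUTO heuristic described in the javadoc above; the method name, signature, and placement are assumptions, with only the thresholds (100 workers, 1,000,000,000 bytes) taken from the documentation.

// Illustrative helper only: resolves AUTO to a concrete mode using the documented thresholds.
static ClusterStatisticsMergeMode resolveAutoMode(final int workerCount, final long combinedSketchBytes)
{
  if (workerCount > 100 || combinedSketchBytes > 1_000_000_000L) {
    return ClusterStatisticsMergeMode.SEQUENTIAL; // large inputs: favor accuracy over speed
  }
  return ClusterStatisticsMergeMode.PARALLEL;     // small inputs: favor speed
}
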
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Controller.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Controller.java
index 07730de45e7a..fe010b219e49 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Controller.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Controller.java
@@ -27,7 +27,7 @@
import org.apache.druid.msq.counters.CounterSnapshotsTree;
import org.apache.druid.msq.indexing.MSQControllerTask;
import org.apache.druid.msq.indexing.error.MSQErrorReport;
-import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.statistics.PartialKeyStatisticsInformation;
import javax.annotation.Nullable;
import java.util.List;
@@ -81,9 +81,11 @@ public String getId()
// Worker-to-controller messages
/**
- * Provide a {@link ClusterByStatisticsSnapshot} for shuffling stages.
+ * Accepts a {@link PartialKeyStatisticsInformation} and updates the controller's key statistics information. If all key
+ * statistics have been gathered, enqueues the task with the {@link WorkerSketchFetcher} to generate partition boundaries.
+ * This is intended to be called by the {@link org.apache.druid.msq.indexing.ControllerChatHandler}.
*/
- void updateStatus(int stageNumber, int workerNumber, Object keyStatisticsObject);
+ void updatePartialKeyStatisticsInformation(int stageNumber, int workerNumber, Object partialKeyStatisticsInformationObject);
/**
* System error reported by a subtask. Note that the errors are organized by
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerClient.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerClient.java
index faf1c3ff5e98..9d197b76dd17 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerClient.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerClient.java
@@ -22,7 +22,7 @@
import org.apache.druid.msq.counters.CounterSnapshotsTree;
import org.apache.druid.msq.indexing.error.MSQErrorReport;
import org.apache.druid.msq.kernel.StageId;
-import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.statistics.PartialKeyStatisticsInformation;
import javax.annotation.Nullable;
import java.io.IOException;
@@ -34,13 +34,13 @@
public interface ControllerClient extends AutoCloseable
{
/**
- * Client side method to update the controller with key statistics for a particular stage and worker.
- * Controller's implementation collates all the key statistics for a stage to generate the partition boundaries.
+ * Client side method to update the controller with partial key statistics information for a particular stage and worker.
+ * Controller's implementation collates all the information for a stage to fetch key statistics from workers.
*/
- void postKeyStatistics(
+ void postPartialKeyStatistics(
StageId stageId,
int workerNumber,
- ClusterByStatisticsSnapshot keyStatistics
+ PartialKeyStatisticsInformation partialKeyStatisticsInformation
) throws IOException;
/**
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerImpl.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerImpl.java
index a4812292fb15..528baa4c27d1 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerImpl.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ControllerImpl.java
@@ -64,6 +64,7 @@
import org.apache.druid.indexing.overlord.SegmentPublishResult;
import org.apache.druid.indexing.overlord.Segments;
import org.apache.druid.java.util.common.DateTimes;
+import org.apache.druid.java.util.common.Either;
import org.apache.druid.java.util.common.IAE;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.Intervals;
@@ -107,6 +108,7 @@
import org.apache.druid.msq.indexing.error.MSQWarningReportLimiterPublisher;
import org.apache.druid.msq.indexing.error.MSQWarnings;
import org.apache.druid.msq.indexing.error.QueryNotSupportedFault;
+import org.apache.druid.msq.indexing.error.TooManyPartitionsFault;
import org.apache.druid.msq.indexing.error.TooManyWarningsFault;
import org.apache.druid.msq.indexing.error.UnknownFault;
import org.apache.druid.msq.indexing.report.MSQResultsReport;
@@ -149,7 +151,8 @@
import org.apache.druid.msq.shuffle.DurableStorageInputChannelFactory;
import org.apache.druid.msq.shuffle.DurableStorageUtils;
import org.apache.druid.msq.shuffle.WorkerInputChannelFactory;
-import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.statistics.CompleteKeyStatisticsInformation;
+import org.apache.druid.msq.statistics.PartialKeyStatisticsInformation;
import org.apache.druid.msq.util.DimensionSchemaUtils;
import org.apache.druid.msq.util.IntervalUtils;
import org.apache.druid.msq.util.MSQFutureUtils;
@@ -201,6 +204,7 @@
import java.util.Set;
import java.util.concurrent.ArrayBlockingQueue;
import java.util.concurrent.BlockingQueue;
+import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentLinkedQueue;
import java.util.concurrent.ThreadLocalRandom;
@@ -259,6 +263,7 @@ public class ControllerImpl implements Controller
// For live reports. Written by the main controller thread, read by HTTP threads.
private final ConcurrentHashMap stagePartitionCountsForLiveReports = new ConcurrentHashMap<>();
+ private WorkerSketchFetcher workerSketchFetcher;
// Time at which the query started.
// For live reports. Written by the main controller thread, read by HTTP threads.
private volatile DateTime queryStartTime = null;
@@ -521,6 +526,16 @@ private QueryDefinition initializeQueryDefAndState(final Closer closer)
this.netClient = new ExceptionWrappingWorkerClient(context.taskClientFor(this));
closer.register(netClient::close);
+ ClusterStatisticsMergeMode clusterStatisticsMergeMode =
+ MultiStageQueryContext.getClusterStatisticsMergeMode(task.getQuerySpec().getQuery().context());
+
+ log.debug("Query [%s] cluster statistics merge mode is set to %s.", id(), clusterStatisticsMergeMode);
+
+ int statisticsMaxRetainedBytes = WorkerMemoryParameters.createProductionInstanceForController(context.injector())
+ .getPartitionStatisticsMaxRetainedBytes();
+ this.workerSketchFetcher = new WorkerSketchFetcher(netClient, clusterStatisticsMergeMode, statisticsMaxRetainedBytes);
+ closer.register(workerSketchFetcher::close);
+
final boolean isDurableStorageEnabled =
MultiStageQueryContext.isDurableStorageEnabled(task.getQuerySpec().getQuery().context());
@@ -565,10 +580,12 @@ private QueryDefinition initializeQueryDefAndState(final Closer closer)
}
/**
- * Provide a {@link ClusterByStatisticsSnapshot} for shuffling stages.
+ * Accepts a {@link PartialKeyStatisticsInformation} and updates the controller's key statistics information. If all key
+ * statistics information has been gathered, enqueues the task with the {@link WorkerSketchFetcher} to generate
+ * partition boundaries. This is intended to be called by the {@link org.apache.druid.msq.indexing.ControllerChatHandler}.
*/
@Override
- public void updateStatus(int stageNumber, int workerNumber, Object keyStatisticsObject)
+ public void updatePartialKeyStatisticsInformation(int stageNumber, int workerNumber, Object partialKeyStatisticsInformationObject)
{
addToKernelManipulationQueue(
queryKernel -> {
@@ -582,9 +599,9 @@ public void updateStatus(int stageNumber, int workerNumber, Object keyStatistics
stageDef.getShuffleSpec().get().doesAggregateByClusterKey()
);
- final ClusterByStatisticsSnapshot keyStatistics;
+ final PartialKeyStatisticsInformation partialKeyStatisticsInformation;
try {
- keyStatistics = mapper.convertValue(keyStatisticsObject, ClusterByStatisticsSnapshot.class);
+ partialKeyStatisticsInformation = mapper.convertValue(partialKeyStatisticsInformationObject, PartialKeyStatisticsInformation.class);
}
catch (IllegalArgumentException e) {
throw new IAE(
@@ -595,7 +612,36 @@ public void updateStatus(int stageNumber, int workerNumber, Object keyStatistics
);
}
- queryKernel.addResultKeyStatisticsForStageAndWorker(stageId, workerNumber, keyStatistics);
+ queryKernel.addPartialKeyStatisticsForStageAndWorker(stageId, workerNumber, partialKeyStatisticsInformation);
+
+ if (queryKernel.getStagePhase(stageId).equals(ControllerStagePhase.MERGING_STATISTICS)) {
+ List workerTaskIds = workerTaskLauncher.getTaskList();
+ CompleteKeyStatisticsInformation completeKeyStatisticsInformation =
+ queryKernel.getCompleteKeyStatisticsInformation(stageId);
+
+ // Queue the sketch fetching task into the worker sketch fetcher.
+ CompletableFuture> clusterByPartitionsCompletableFuture =
+ workerSketchFetcher.submitFetcherTask(
+ completeKeyStatisticsInformation,
+ workerTaskIds,
+ stageDef
+ );
+
+ // Add the listener to handle completion.
+ clusterByPartitionsCompletableFuture.whenComplete((clusterByPartitionsEither, throwable) -> {
+ addToKernelManipulationQueue(holder -> {
+ if (throwable != null) {
+ holder.failStageForReason(stageId, UnknownFault.forException(throwable));
+ } else if (clusterByPartitionsEither.isError()) {
+ holder.failStageForReason(stageId, new TooManyPartitionsFault(stageDef.getMaxPartitionCount()));
+ } else {
+ log.debug("Query [%s] Partition boundaries generated for stage %s", id(), stageId);
+ holder.setClusterByPartitionBoundaries(stageId, clusterByPartitionsEither.valueOrThrow());
+ }
+ holder.transitionStageKernel(stageId, queryKernel.getStagePhase(stageId));
+ });
+ });
+ }
}
);
}
@@ -943,7 +989,7 @@ private QueryKit makeQueryControllerToolKit()
final Map, QueryKit> kitMap =
ImmutableMap., QueryKit>builder()
.put(ScanQuery.class, new ScanQueryKit(context.jsonMapper()))
- .put(GroupByQuery.class, new GroupByQueryKit())
+ .put(GroupByQuery.class, new GroupByQueryKit(context.jsonMapper()))
.build();
return new MultiQueryKit(kitMap);
@@ -1959,11 +2005,7 @@ public RunQueryUntilDone(
this.queryDef = queryDef;
this.inputSpecSlicerFactory = inputSpecSlicerFactory;
this.closer = closer;
- this.queryKernel = new ControllerQueryKernel(
- queryDef,
- WorkerMemoryParameters.createProductionInstanceForController(context.injector())
- .getPartitionStatisticsMaxRetainedBytes()
- );
+ this.queryKernel = new ControllerQueryKernel(queryDef);
}
/**
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ExceptionWrappingWorkerClient.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ExceptionWrappingWorkerClient.java
index 1c3cc39987c7..3d78b7c9ced4 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ExceptionWrappingWorkerClient.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/ExceptionWrappingWorkerClient.java
@@ -31,6 +31,7 @@
import org.apache.druid.msq.indexing.error.WorkerRpcFailedFault;
import org.apache.druid.msq.kernel.StageId;
import org.apache.druid.msq.kernel.WorkOrder;
+import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
import javax.annotation.Nullable;
import java.io.IOException;
@@ -55,6 +56,23 @@ public ListenableFuture postWorkOrder(String workerTaskId, WorkOrder workO
return wrap(workerTaskId, client, c -> c.postWorkOrder(workerTaskId, workOrder));
}
+ @Override
+ public ListenableFuture fetchClusterByStatisticsSnapshot(String workerTaskId, String queryId, int stageNumber)
+ {
+ return client.fetchClusterByStatisticsSnapshot(workerTaskId, queryId, stageNumber);
+ }
+
+ @Override
+ public ListenableFuture fetchClusterByStatisticsSnapshotForTimeChunk(
+ String workerTaskId,
+ String queryId,
+ int stageNumber,
+ long timeChunk
+ )
+ {
+ return client.fetchClusterByStatisticsSnapshotForTimeChunk(workerTaskId, queryId, stageNumber, timeChunk);
+ }
+
@Override
public ListenableFuture postResultPartitionBoundaries(
final String workerTaskId,
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Worker.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Worker.java
index f069c91e145a..cc5f0fae1732 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Worker.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/Worker.java
@@ -25,6 +25,7 @@
import org.apache.druid.msq.indexing.MSQWorkerTask;
import org.apache.druid.msq.kernel.StageId;
import org.apache.druid.msq.kernel.WorkOrder;
+import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
import javax.annotation.Nullable;
import java.io.IOException;
@@ -67,6 +68,18 @@ public interface Worker
*/
void postWorkOrder(WorkOrder workOrder);
+ /**
+ * Returns the statistics snapshot for the given stageId. This is called from {@link WorkerSketchFetcher} under
+ * PARALLEL or AUTO modes.
+ */
+ ClusterByStatisticsSnapshot fetchStatisticsSnapshot(StageId stageId);
+
+ /**
+ * Returns the statistics snapshot for the given stageId which contains only the sketch for the specified timeChunk.
+ * This is called from {@link WorkerSketchFetcher} under SEQUENTIAL or AUTO modes.
+ */
+ ClusterByStatisticsSnapshot fetchStatisticsSnapshotForTimeChunk(StageId stageId, long timeChunk);
+
/**
* Called when the worker chat handler receives the result partition boundaries for a particular stageNumber
* and queryId
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerClient.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerClient.java
index 8f4c7bac239a..5c02a79f89a3 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerClient.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerClient.java
@@ -25,6 +25,7 @@
import org.apache.druid.msq.counters.CounterSnapshotsTree;
import org.apache.druid.msq.kernel.StageId;
import org.apache.druid.msq.kernel.WorkOrder;
+import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
import java.io.IOException;
@@ -38,6 +39,27 @@ public interface WorkerClient extends AutoCloseable
*/
ListenableFuture<Void> postWorkOrder(String workerTaskId, WorkOrder workOrder);
+ /**
+ * Fetches the {@link ClusterByStatisticsSnapshot} from a worker. This is intended to be used by the
+ * {@link WorkerSketchFetcher} under PARALLEL or AUTO modes.
+ */
+ ListenableFuture<ClusterByStatisticsSnapshot> fetchClusterByStatisticsSnapshot(
+ String workerTaskId,
+ String queryId,
+ int stageNumber
+ );
+
+ /**
+ * Fetches a {@link ClusterByStatisticsSnapshot} which contains only the sketch of the specified timeChunk.
+ * This is intended to be used by the {@link WorkerSketchFetcher} under SEQUENTIAL or AUTO modes.
+ */
+ ListenableFuture<ClusterByStatisticsSnapshot> fetchClusterByStatisticsSnapshotForTimeChunk(
+ String workerTaskId,
+ String queryId,
+ int stageNumber,
+ long timeChunk
+ );
+
/**
* Worker's client method to inform it of the partition boundaries for the given stage. This is usually invoked by the
* controller after collating the result statistics from all the workers processing the query
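A sketch of gathering one time chunk's sketches from every worker that holds it, using this client interface; the helper name is hypothetical and error handling is elided:

    import com.google.common.util.concurrent.Futures;
    import com.google.common.util.concurrent.ListenableFuture;
    import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;

    import java.util.ArrayList;
    import java.util.List;

    // Hypothetical helper: one fetch per worker, combined into a single future that
    // completes when all workers have responded.
    ListenableFuture<List<ClusterByStatisticsSnapshot>> fetchTimeChunkFromAll(
        WorkerClient client,
        List<String> workerTaskIds,
        String queryId,
        int stageNumber,
        long timeChunk
    )
    {
      List<ListenableFuture<ClusterByStatisticsSnapshot>> futures = new ArrayList<>();
      for (String workerTaskId : workerTaskIds) {
        futures.add(
            client.fetchClusterByStatisticsSnapshotForTimeChunk(workerTaskId, queryId, stageNumber, timeChunk)
        );
      }
      return Futures.allAsList(futures);
    }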
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerImpl.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerImpl.java
index 5b68041d0e97..49d6f9080d7c 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerImpl.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerImpl.java
@@ -106,6 +106,7 @@
import org.apache.druid.msq.shuffle.WorkerInputChannelFactory;
import org.apache.druid.msq.statistics.ClusterByStatisticsCollector;
import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.statistics.PartialKeyStatisticsInformation;
import org.apache.druid.msq.util.DecoratedExecutorService;
import org.apache.druid.msq.util.MultiStageQueryContext;
import org.apache.druid.query.PrioritizedCallable;
@@ -159,6 +160,7 @@ public class WorkerImpl implements Worker
private final BlockingQueue<Consumer<KernelHolder>> kernelManipulationQueue = new LinkedBlockingDeque<>();
private final ConcurrentHashMap<StageId, ConcurrentHashMap<Integer, ReadableFrameChannel>> stageOutputs = new ConcurrentHashMap<>();
private final ConcurrentHashMap<StageId, CounterTracker> stageCounters = new ConcurrentHashMap<>();
+ private final ConcurrentHashMap<StageId, WorkerStageKernel> stageKernelMap = new ConcurrentHashMap<>();
private final boolean durableStageStorageEnabled;
/**
@@ -365,10 +367,14 @@ public Optional<MSQErrorReport> runTask(final Closer closer) throws Exception
if (kernel.getPhase() == WorkerStagePhase.READING_INPUT && kernel.hasResultKeyStatisticsSnapshot()) {
if (controllerAlive) {
- controllerClient.postKeyStatistics(
+ PartialKeyStatisticsInformation partialKeyStatisticsInformation =
+ kernel.getResultKeyStatisticsSnapshot()
+ .partialKeyStatistics();
+
+ controllerClient.postPartialKeyStatistics(
stageDefinition.getId(),
kernel.getWorkOrder().getWorkerNumber(),
- kernel.getResultKeyStatisticsSnapshot()
+ partialKeyStatisticsInformation
);
}
kernel.startPreshuffleWaitingForResultPartitionBoundaries();
@@ -562,6 +568,19 @@ public void postFinish()
kernelManipulationQueue.add(KernelHolder::setDone);
}
+ @Override
+ public ClusterByStatisticsSnapshot fetchStatisticsSnapshot(StageId stageId)
+ {
+ return stageKernelMap.get(stageId).getResultKeyStatisticsSnapshot();
+ }
+
+ @Override
+ public ClusterByStatisticsSnapshot fetchStatisticsSnapshotForTimeChunk(StageId stageId, long timeChunk)
+ {
+ ClusterByStatisticsSnapshot snapshot = stageKernelMap.get(stageId).getResultKeyStatisticsSnapshot();
+ return snapshot.getSnapshotForTimeChunk(timeChunk);
+ }
+
@Override
public CounterSnapshotsTree getCounters()
{
@@ -1273,9 +1292,8 @@ public ReadableFrameChannel openChannel(StageId stageId, int workerNumber, int p
}
}
- private static class KernelHolder
+ private class KernelHolder
{
- private final Map<StageId, WorkerStageKernel> stageKernelMap = new HashMap<>();
private boolean done = false;
public Map<StageId, WorkerStageKernel> getStageKernelMap()
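The lookups in fetchStatisticsSnapshot above assume the stage kernel exists; a defensive variant (a sketch only, not in this patch) would fail with a clear message rather than a NullPointerException:

    // Hypothetical null-safe variant of WorkerImpl#fetchStatisticsSnapshot.
    ClusterByStatisticsSnapshot fetchStatisticsSnapshotSafely(StageId stageId)
    {
      final WorkerStageKernel kernel = stageKernelMap.get(stageId);
      if (kernel == null) {
        throw new ISE("No stage kernel found for stage [%s]", stageId);
      }
      return kernel.getResultKeyStatisticsSnapshot();
    }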
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerSketchFetcher.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerSketchFetcher.java
new file mode 100644
index 000000000000..dc6f21990587
--- /dev/null
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/exec/WorkerSketchFetcher.java
@@ -0,0 +1,344 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.msq.exec;
+
+import com.google.common.util.concurrent.ListenableFuture;
+import org.apache.druid.frame.key.ClusterBy;
+import org.apache.druid.frame.key.ClusterByPartition;
+import org.apache.druid.frame.key.ClusterByPartitions;
+import org.apache.druid.java.util.common.Either;
+import org.apache.druid.java.util.common.ISE;
+import org.apache.druid.java.util.common.concurrent.Execs;
+import org.apache.druid.java.util.common.logger.Logger;
+import org.apache.druid.msq.kernel.StageDefinition;
+import org.apache.druid.msq.statistics.ClusterByStatisticsCollector;
+import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.statistics.CompleteKeyStatisticsInformation;
+
+import java.util.ArrayList;
+import java.util.HashSet;
+import java.util.Iterator;
+import java.util.List;
+import java.util.Map;
+import java.util.Set;
+import java.util.concurrent.CompletableFuture;
+import java.util.concurrent.ExecutorService;
+import java.util.stream.IntStream;
+
+/**
+ * Queues up fetching sketches from workers and progressively generates partition boundaries.
+ */
+public class WorkerSketchFetcher implements AutoCloseable
+{
+ private static final Logger log = new Logger(WorkerSketchFetcher.class);
+ private static final int DEFAULT_THREAD_COUNT = 4;
+ // If the combined size of worker sketches is more than this threshold, SEQUENTIAL merging mode is used.
+ static final long BYTES_THRESHOLD = 1_000_000_000L;
+ // If there are more workers than this threshold, SEQUENTIAL merging mode is used.
+ static final long WORKER_THRESHOLD = 100;
+
+ private final ClusterStatisticsMergeMode clusterStatisticsMergeMode;
+ private final int statisticsMaxRetainedBytes;
+ private final WorkerClient workerClient;
+ private final ExecutorService executorService;
+
+ public WorkerSketchFetcher(
+ WorkerClient workerClient,
+ ClusterStatisticsMergeMode clusterStatisticsMergeMode,
+ int statisticsMaxRetainedBytes
+ )
+ {
+ this.workerClient = workerClient;
+ this.clusterStatisticsMergeMode = clusterStatisticsMergeMode;
+ this.executorService = Execs.multiThreaded(DEFAULT_THREAD_COUNT, "SketchFetcherThreadPool-%d");
+ this.statisticsMaxRetainedBytes = statisticsMaxRetainedBytes;
+ }
+
+ /**
+ * Submits a request to fetch sketches and generate partitions for the given worker statistics, and returns a future
+ * for the result. Based on the statistics, it decides whether to fetch the sketches all at once or one time chunk
+ * at a time.
+ */
+ public CompletableFuture<Either<Long, ClusterByPartitions>> submitFetcherTask(
+ CompleteKeyStatisticsInformation completeKeyStatisticsInformation,
+ List<String> workerTaskIds,
+ StageDefinition stageDefinition
+ )
+ {
+ ClusterBy clusterBy = stageDefinition.getClusterBy();
+
+ switch (clusterStatisticsMergeMode) {
+ case SEQUENTIAL:
+ return sequentialTimeChunkMerging(completeKeyStatisticsInformation, stageDefinition, workerTaskIds);
+ case PARALLEL:
+ return inMemoryFullSketchMerging(stageDefinition, workerTaskIds);
+ case AUTO:
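+ // Decision order: with no time bucketing there is nothing to merge chunk by
+ // chunk, so PARALLEL is used; a large worker count or large retained sketch
+ // size favours SEQUENTIAL to bound controller memory; otherwise PARALLEL.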
+ if (clusterBy.getBucketByCount() == 0) {
+ log.info("Query [%s] AUTO mode: chose PARALLEL mode to merge key statistics", stageDefinition.getId().getQueryId());
+ // If there is no time clustering, there is no scope for sequential merge
+ return inMemoryFullSketchMerging(stageDefinition, workerTaskIds);
+ } else if (stageDefinition.getMaxWorkerCount() > WORKER_THRESHOLD || completeKeyStatisticsInformation.getBytesRetained() > BYTES_THRESHOLD) {
+ log.info("Query [%s] AUTO mode: chose SEQUENTIAL mode to merge key statistics", stageDefinition.getId().getQueryId());
+ return sequentialTimeChunkMerging(completeKeyStatisticsInformation, stageDefinition, workerTaskIds);
+ }
+ log.info("Query [%s] AUTO mode: chose PARALLEL mode to merge key statistics", stageDefinition.getId().getQueryId());
+ return inMemoryFullSketchMerging(stageDefinition, workerTaskIds);
+ default:
+ throw new IllegalStateException("No fetching strategy found for mode: " + clusterStatisticsMergeMode);
+ }
+ }
+
+ /**
+ * Fetches the full {@link ClusterByStatisticsCollector} from all workers and generates partition boundaries from them.
+ * This is faster than fetching them time chunk by time chunk, but the collector will be downsampled until it can
+ * fit on the controller, resulting in less accurate partition boundaries.
+ */
+ CompletableFuture<Either<Long, ClusterByPartitions>> inMemoryFullSketchMerging(
+ StageDefinition stageDefinition,
+ List<String> workerTaskIds
+ )
+ {
+ CompletableFuture<Either<Long, ClusterByPartitions>> partitionFuture = new CompletableFuture<>();
+
+ // Create a new key statistics collector to merge worker sketches into
+ final ClusterByStatisticsCollector mergedStatisticsCollector =
+ stageDefinition.createResultKeyStatisticsCollector(statisticsMaxRetainedBytes);
+ final int workerCount = workerTaskIds.size();
+ // Guarded by synchronized mergedStatisticsCollector
+ final Set<Integer> finishedWorkers = new HashSet<>();
+
+ // Submit a task for each worker to fetch statistics
+ IntStream.range(0, workerCount).forEach(workerNo -> {
+ executorService.submit(() -> {
+ ListenableFuture<ClusterByStatisticsSnapshot> snapshotFuture =
+ workerClient.fetchClusterByStatisticsSnapshot(
+ workerTaskIds.get(workerNo),
+ stageDefinition.getId().getQueryId(),
+ stageDefinition.getStageNumber()
+ );
+ try {
+ ClusterByStatisticsSnapshot clusterByStatisticsSnapshot = snapshotFuture.get();
+ if (clusterByStatisticsSnapshot == null) {
+ throw new ISE("Worker %s returned null sketch, this should never happen", workerNo);
+ }
+ synchronized (mergedStatisticsCollector) {
+ mergedStatisticsCollector.addAll(clusterByStatisticsSnapshot);
+ finishedWorkers.add(workerNo);
+
+ if (finishedWorkers.size() == workerCount) {
+ log.debug("Query [%s] Received all statistics, generating partitions", stageDefinition.getId().getQueryId());
+ partitionFuture.complete(stageDefinition.generatePartitionsForShuffle(mergedStatisticsCollector));
+ }
+ }
+ }
+ catch (Exception e) {
+ synchronized (mergedStatisticsCollector) {
+ if (!partitionFuture.isDone()) {
+ partitionFuture.completeExceptionally(e);
+ mergedStatisticsCollector.clear();
+ }
+ }
+ }
+ });
+ });
+
+ return partitionFuture;
+ }
+
+ /**
+ * Fetches cluster statistics from all workers and generates partition boundaries from them one time chunk at a time.
+ * This takes longer due to the overhead of fetching sketches; however, it prevents any loss of accuracy from
+ * downsampling on the controller.
+ */
+ CompletableFuture<Either<Long, ClusterByPartitions>> sequentialTimeChunkMerging(
+ CompleteKeyStatisticsInformation completeKeyStatisticsInformation,
+ StageDefinition stageDefinition,
+ List<String> workerTaskIds
+ )
+ {
+ SequentialFetchStage sequentialFetchStage = new SequentialFetchStage(
+ stageDefinition,
+ workerTaskIds,
+ completeKeyStatisticsInformation.getTimeSegmentVsWorkerMap().entrySet().iterator()
+ );
+ sequentialFetchStage.submitFetchingTasksForNextTimeChunk();
+ return sequentialFetchStage.getPartitionFuture();
+ }
+
+ private class SequentialFetchStage
+ {
+ private final StageDefinition stageDefinition;
+ private final List<String> workerTaskIds;
+ private final Iterator<Map.Entry<Long, Set<Integer>>> timeSegmentVsWorkerIdIterator;
+ private final CompletableFuture<Either<Long, ClusterByPartitions>> partitionFuture;
+ // Final sorted list of partition boundaries. This is appended to after statistics for each time chunk are gathered.
+ private final List<ClusterByPartition> finalPartitionBoundries;
+
+ public SequentialFetchStage(
+ StageDefinition stageDefinition,
+ List<String> workerTaskIds,
+ Iterator<Map.Entry<Long, Set<Integer>>> timeSegmentVsWorkerIdIterator
+ )
+ {
+ this.finalPartitionBoundries = new ArrayList<>();
+ this.stageDefinition = stageDefinition;
+ this.workerTaskIds = workerTaskIds;
+ this.timeSegmentVsWorkerIdIterator = timeSegmentVsWorkerIdIterator;
+ this.partitionFuture = new CompletableFuture<>();
+ }
+
+ /**
+ * Submits the tasks to fetch key statistics for the time chunk pointed to by {@link #timeSegmentVsWorkerIdIterator}.
+ * Once the statistics have been gathered from all workers which have them, generates partitions and adds them to
+ * {@link #finalPartitionBoundries}, stitching the partitions between time chunks using
+ * {@link #abutAndAppendPartitionBoundries(List, List)} to make them continuous.
+ *
+ * The time chunks returned by {@link #timeSegmentVsWorkerIdIterator} should be in ascending order for the partitions
+ * to be generated correctly.
+ *
+ * If {@link #timeSegmentVsWorkerIdIterator} doesn't have any more values, assumes that partition boundaries have
+ * been successfully generated and completes {@link #partitionFuture} with the result.
+ *
+ * Completes the future with an error as soon as the number of partitions exceeds the maximum partition count for
+ * the stage definition.
+ */
+ public void submitFetchingTasksForNextTimeChunk()
+ {
+ if (!timeSegmentVsWorkerIdIterator.hasNext()) {
+ partitionFuture.complete(Either.value(new ClusterByPartitions(finalPartitionBoundries)));
+ } else {
+ Map.Entry<Long, Set<Integer>> entry = timeSegmentVsWorkerIdIterator.next();
+ // Time chunk for which partition boundaries are going to be generated
+ Long timeChunk = entry.getKey();
+ Set<Integer> workerIdsWithTimeChunk = entry.getValue();
+ // Create a new key statistics collector to merge worker sketches into
+ ClusterByStatisticsCollector mergedStatisticsCollector =
+ stageDefinition.createResultKeyStatisticsCollector(statisticsMaxRetainedBytes);
+ // Guarded by synchronized mergedStatisticsCollector
+ Set<Integer> finishedWorkers = new HashSet<>();
+
+ log.debug("Query [%s]. Submitting request for statistics for time chunk %s to %s workers",
+ stageDefinition.getId().getQueryId(),
+ timeChunk,
+ workerIdsWithTimeChunk.size());
+
+ // Submit a task for every worker that has the given time chunk
+ for (int workerNo : workerIdsWithTimeChunk) {
+ executorService.submit(() -> {
+ ListenableFuture<ClusterByStatisticsSnapshot> snapshotFuture =
+ workerClient.fetchClusterByStatisticsSnapshotForTimeChunk(
+ workerTaskIds.get(workerNo),
+ stageDefinition.getId().getQueryId(),
+ stageDefinition.getStageNumber(),
+ timeChunk
+ );
+
+ try {
+ ClusterByStatisticsSnapshot snapshotForTimeChunk = snapshotFuture.get();
+ if (snapshotForTimeChunk == null) {
+ throw new ISE("Worker %s returned null sketch for %s, this should never happen", workerNo, timeChunk);
+ }
+ synchronized (mergedStatisticsCollector) {
+ mergedStatisticsCollector.addAll(snapshotForTimeChunk);
+ finishedWorkers.add(workerNo);
+
+ if (finishedWorkers.size() == workerIdsWithTimeChunk.size()) {
+ Either<Long, ClusterByPartitions> longClusterByPartitionsEither =
+ stageDefinition.generatePartitionsForShuffle(mergedStatisticsCollector);
+
+ log.debug("Query [%s]. Received all statistics for time chunk %s, generating partitions",
+ stageDefinition.getId().getQueryId(),
+ timeChunk);
+
+ long totalPartitionCount = finalPartitionBoundries.size() + getPartitionCountFromEither(longClusterByPartitionsEither);
+ if (totalPartitionCount > stageDefinition.getMaxPartitionCount()) {
+ // Fail fast if more partitions than the maximum have been reached.
+ partitionFuture.complete(Either.error(totalPartitionCount));
+ mergedStatisticsCollector.clear();
+ } else {
+ List<ClusterByPartition> timeSketchPartitions = longClusterByPartitionsEither.valueOrThrow().ranges();
+ abutAndAppendPartitionBoundries(finalPartitionBoundries, timeSketchPartitions);
+ log.debug("Query [%s]. Finished generating partitions for time chunk %s, total count so far %s",
+ stageDefinition.getId().getQueryId(),
+ timeChunk,
+ finalPartitionBoundries.size());
+ submitFetchingTasksForNextTimeChunk();
+ }
+ }
+ }
+ }
+ catch (Exception e) {
+ synchronized (mergedStatisticsCollector) {
+ if (!partitionFuture.isDone()) {
+ partitionFuture.completeExceptionally(e);
+ mergedStatisticsCollector.clear();
+ }
+ }
+ }
+ });
+ }
+ }
+ }
+
+ /**
+ * Takes a sorted list of {@link ClusterByPartition} ranges, {@code timeSketchPartitions}, and appends it to the
+ * sorted list {@code finalPartitionBoundries}. If {@code finalPartitionBoundries} is not empty, the end time of its
+ * last partition is changed to abut the start time of the first partition of {@code timeSketchPartitions}.
+ *
+ * This is used to make the generated partitions continuous.
+ */
+ private void abutAndAppendPartitionBoundries(
+ List<ClusterByPartition> finalPartitionBoundries,
+ List<ClusterByPartition> timeSketchPartitions
+ )
+ {
+ if (!finalPartitionBoundries.isEmpty()) {
+ // Stitch up the end time of the last partition with the start time of the first partition.
+ ClusterByPartition clusterByPartition = finalPartitionBoundries.remove(finalPartitionBoundries.size() - 1);
+ finalPartitionBoundries.add(new ClusterByPartition(clusterByPartition.getStart(), timeSketchPartitions.get(0).getStart()));
+ }
+ finalPartitionBoundries.addAll(timeSketchPartitions);
+ }
+
+ public CompletableFuture<Either<Long, ClusterByPartitions>> getPartitionFuture()
+ {
+ return partitionFuture;
+ }
+ }
+
+ /**
+ * Gets the partition count from an {@link Either}. If it is an error, the error long denotes the number of
+ * partitions (set when too many partitions were created); otherwise, returns the size of the partition list.
+ */
+ private static long getPartitionCountFromEither(Either<Long, ClusterByPartitions> either)
+ {
+ if (either.isError()) {
+ return either.error();
+ } else {
+ return either.valueOrThrow().size();
+ }
+ }
+
+ @Override
+ public void close()
+ {
+ executorService.shutdownNow();
+ }
+}
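A toy illustration of the stitching that abutAndAppendPartitionBoundries performs, using integer endpoints in place of the real RowKey-based ClusterByPartition ranges (Java 16+ records used for brevity; this models the logic, it is not Druid code):

    import java.util.ArrayList;
    import java.util.List;

    class AbutExample
    {
      // Toy partition: [start, end), where a null end means "unbounded".
      record Range(int start, Integer end) {}

      static void abutAndAppend(List<Range> finalBoundaries, List<Range> next)
      {
        if (!finalBoundaries.isEmpty()) {
          // Close the last accumulated partition at the start of the incoming chunk's
          // first partition, so the overall list stays continuous.
          Range last = finalBoundaries.remove(finalBoundaries.size() - 1);
          finalBoundaries.add(new Range(last.start(), next.get(0).start()));
        }
        finalBoundaries.addAll(next);
      }

      public static void main(String[] args)
      {
        List<Range> acc = new ArrayList<>(List.of(new Range(0, null)));
        abutAndAppend(acc, List.of(new Range(10, 20), new Range(20, null)));
        // Prints: [Range[start=0, end=10], Range[start=10, end=20], Range[start=20, end=null]]
        System.out.println(acc);
      }
    }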
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/guice/MSQSqlModule.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/guice/MSQSqlModule.java
index e2c47c2a2dda..5335e40b0e9c 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/guice/MSQSqlModule.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/guice/MSQSqlModule.java
@@ -21,7 +21,6 @@
import com.fasterxml.jackson.databind.Module;
import com.google.inject.Binder;
-import com.google.inject.Inject;
import com.google.inject.Provides;
import org.apache.druid.discovery.NodeRole;
import org.apache.druid.guice.LazySingleton;
@@ -33,10 +32,12 @@
import org.apache.druid.sql.SqlStatementFactory;
import org.apache.druid.sql.SqlToolbox;
import org.apache.druid.sql.calcite.external.ExternalOperatorConversion;
+import org.apache.druid.sql.calcite.external.HttpOperatorConversion;
+import org.apache.druid.sql.calcite.external.InlineOperatorConversion;
+import org.apache.druid.sql.calcite.external.LocalOperatorConversion;
import org.apache.druid.sql.guice.SqlBindings;
import java.util.List;
-import java.util.Properties;
/**
* Module for providing the {@code EXTERN} operator.
@@ -44,9 +45,6 @@
@LoadScope(roles = NodeRole.BROKER_JSON_NAME)
public class MSQSqlModule implements DruidModule
{
- @Inject
- Properties properties = null;
-
@Override
public List<? extends Module> getJacksonModules()
{
@@ -64,9 +62,11 @@ public void configure(Binder binder)
// Set up the EXTERN macro.
SqlBindings.addOperatorConversion(binder, ExternalOperatorConversion.class);
+ SqlBindings.addOperatorConversion(binder, HttpOperatorConversion.class);
+ SqlBindings.addOperatorConversion(binder, InlineOperatorConversion.class);
+ SqlBindings.addOperatorConversion(binder, LocalOperatorConversion.class);
}
-
@Provides
@MSQ
@LazySingleton
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/ControllerChatHandler.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/ControllerChatHandler.java
index 1857d83708c7..8fa04ce6d90b 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/ControllerChatHandler.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/ControllerChatHandler.java
@@ -26,7 +26,8 @@
import org.apache.druid.msq.exec.Controller;
import org.apache.druid.msq.exec.ControllerClient;
import org.apache.druid.msq.indexing.error.MSQErrorReport;
-import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.kernel.StageId;
+import org.apache.druid.msq.statistics.PartialKeyStatisticsInformation;
import org.apache.druid.segment.realtime.firehose.ChatHandler;
import org.apache.druid.segment.realtime.firehose.ChatHandlers;
import org.apache.druid.server.security.Action;
@@ -58,16 +59,17 @@ public ControllerChatHandler(TaskToolbox toolbox, Controller controller)
}
/**
- * Used by subtasks to post {@link ClusterByStatisticsSnapshot} for shuffling stages.
+ * Used by subtasks to post {@link PartialKeyStatisticsInformation} for shuffling stages.
*
- * See {@link ControllerClient#postKeyStatistics} for the client-side code that calls this API.
+ * See {@link ControllerClient#postPartialKeyStatistics(StageId, int, PartialKeyStatisticsInformation)}
+ * for the client-side code that calls this API.
*/
@POST
- @Path("/keyStatistics/{queryId}/{stageNumber}/{workerNumber}")
+ @Path("/partialKeyStatisticsInformation/{queryId}/{stageNumber}/{workerNumber}")
@Produces(MediaType.APPLICATION_JSON)
@Consumes(MediaType.APPLICATION_JSON)
- public Response httpPostKeyStatistics(
- final Object keyStatisticsObject,
+ public Response httpPostPartialKeyStatistics(
+ final Object partialKeyStatisticsObject,
@PathParam("queryId") final String queryId,
@PathParam("stageNumber") final int stageNumber,
@PathParam("workerNumber") final int workerNumber,
@@ -75,7 +77,7 @@ public Response httpPostKeyStatistics(
)
{
ChatHandlers.authorizationCheck(req, Action.WRITE, task.getDataSource(), toolbox.getAuthorizerMapper());
- controller.updateStatus(stageNumber, workerNumber, keyStatisticsObject);
+ controller.updatePartialKeyStatisticsInformation(stageNumber, workerNumber, partialKeyStatisticsObject);
return Response.status(Response.Status.ACCEPTED).build();
}
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerControllerClient.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerControllerClient.java
index 3a6c9e78797b..1ff5952a8958 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerControllerClient.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerControllerClient.java
@@ -29,7 +29,7 @@
import org.apache.druid.msq.exec.ControllerClient;
import org.apache.druid.msq.indexing.error.MSQErrorReport;
import org.apache.druid.msq.kernel.StageId;
-import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
+import org.apache.druid.msq.statistics.PartialKeyStatisticsInformation;
import org.apache.druid.rpc.IgnoreHttpResponseHandler;
import org.apache.druid.rpc.RequestBuilder;
import org.apache.druid.rpc.ServiceClient;
@@ -59,14 +59,14 @@ public IndexerControllerClient(
}
@Override
- public void postKeyStatistics(
+ public void postPartialKeyStatistics(
StageId stageId,
int workerNumber,
- ClusterByStatisticsSnapshot keyStatistics
+ PartialKeyStatisticsInformation partialKeyStatisticsInformation
) throws IOException
{
final String path = StringUtils.format(
- "/keyStatistics/%s/%s/%d",
+ "/partialKeyStatisticsInformation/%s/%d/%d",
StringUtils.urlEncode(stageId.getQueryId()),
stageId.getStageNumber(),
workerNumber
@@ -74,7 +74,7 @@ public void postKeyStatistics(
doRequest(
new RequestBuilder(HttpMethod.POST, path)
- .jsonContent(jsonMapper, keyStatistics),
+ .jsonContent(jsonMapper, partialKeyStatisticsInformation),
IgnoreHttpResponseHandler.INSTANCE
);
}
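For illustration only, the request path the format string above produces for hypothetical values (queryId "query-abc", stage 1, worker 3), matching the @Path template on ControllerChatHandler#httpPostPartialKeyStatistics:

    // Hypothetical values; StringUtils is org.apache.druid.java.util.common.StringUtils.
    String path = StringUtils.format(
        "/partialKeyStatisticsInformation/%s/%d/%d",
        StringUtils.urlEncode("query-abc"),
        1,
        3
    );
    // path is "/partialKeyStatisticsInformation/query-abc/1/3"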
diff --git a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerWorkerClient.java b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerWorkerClient.java
index 430c264291f8..980c7f97bee5 100644
--- a/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerWorkerClient.java
+++ b/extensions-core/multi-stage-query/src/main/java/org/apache/druid/msq/indexing/IndexerWorkerClient.java
@@ -41,6 +41,7 @@
import org.apache.druid.msq.exec.WorkerClient;
import org.apache.druid.msq.kernel.StageId;
import org.apache.druid.msq.kernel.WorkOrder;
+import org.apache.druid.msq.statistics.ClusterByStatisticsSnapshot;
import org.apache.druid.rpc.IgnoreHttpResponseHandler;
import org.apache.druid.rpc.RequestBuilder;
import org.apache.druid.rpc.ServiceClient;
@@ -103,6 +104,48 @@ public ListenableFuture