Assume that input data has already been grouped on time and dimensions. Ingestion will
@@ -1546,17 +1550,41 @@ export function getPartitionRelatedTuningSpecFormFields(
},
];
+ if (oneOf(deepGet(spec, 'spec.tuningConfig.partitionsSpec.type'), 'hashed', 'single_dim')) {
+ parallelFields.push({
+ name: 'spec.dataSchema.granularitySpec.intervals',
+ label: 'Time intervals',
+ type: 'string-array',
+ placeholder: 'ex: 2018-01-01/2018-06-01',
+ hideInMore: true,
+ info: (
+ <>
+
A comma separated list of intervals for the raw data being ingested.
+
+ This list is used to determine the shards that will be created. If it is not
+ specified then then an additional job will run to automatically determine the data
+ intervals used.
+
+ >
+ ),
+ });
+ }
+
+ return parallelFields;
+
case 'kafka':
case 'kinesis':
return [
{
- name: 'maxRowsPerSegment',
+ name: 'spec.tuningConfig.maxRowsPerSegment',
+ label: 'Max rows per segment',
type: 'number',
defaultValue: 5000000,
info: <>Determines how many rows are in each segment.>,
},
{
- name: 'maxTotalRows',
+ name: 'spec.tuningConfig.maxTotalRows',
+ label: 'Max total rows',
type: 'number',
defaultValue: 20000000,
info: <>Total number of rows in segments waiting for being pushed.>,
diff --git a/web-console/src/views/load-data-view/load-data-view.tsx b/web-console/src/views/load-data-view/load-data-view.tsx
index 75b427a3e7de..31bb54ca4970 100644
--- a/web-console/src/views/load-data-view/load-data-view.tsx
+++ b/web-console/src/views/load-data-view/load-data-view.tsx
@@ -2214,7 +2214,7 @@ export class LoadDataView extends React.PureComponent this.updateSpec(s)}
+ onChange={this.updateSpec}
/>
this.updateSpec(s)}
+ onChange={this.updateSpec}
/>
)}
this.updateSpec(deepSet(spec, 'spec.dataSchema.granularitySpec', g))}
/>
- {!isStreaming && (
-
- ['hashed', 'single_dim'].includes(
- deepGet(spec, 'spec.tuningConfig.partitionsSpec.type'),
- ),
- info: <>A comma separated list of intervals for the raw data being ingested.>,
- },
- ]}
- model={spec}
- onChange={s => this.updateSpec(s)}
- />
- )}
From 14b8f7f00040271e36f115b27944b39a72ef74bf Mon Sep 17 00:00:00 2001
From: Vadim Ogievetsky
Date: Sun, 6 Dec 2020 15:26:27 -0800
Subject: [PATCH 02/14] don't set redundant fields
---
.../src/druid-models/ingestion-spec.tsx | 88 +++++++++++--------
web-console/src/utils/object-change.ts | 5 ++
.../views/load-data-view/load-data-view.tsx | 63 ++++---------
3 files changed, 73 insertions(+), 83 deletions(-)
diff --git a/web-console/src/druid-models/ingestion-spec.tsx b/web-console/src/druid-models/ingestion-spec.tsx
index bfae30420c1d..2a93825b9aab 100644
--- a/web-console/src/druid-models/ingestion-spec.tsx
+++ b/web-console/src/druid-models/ingestion-spec.tsx
@@ -19,13 +19,14 @@
import { Code } from '@blueprintjs/core';
import React from 'react';
-import { ExternalLink, Field } from '../components';
+import { AutoForm, ExternalLink, Field } from '../components';
import { getLink } from '../links';
import {
deepDelete,
deepGet,
deepMove,
deepSet,
+ deepSetIfUnset,
EMPTY_ARRAY,
EMPTY_OBJECT,
filterMap,
@@ -290,11 +291,9 @@ export function normalizeSpec(spec: Partial): IngestionSpec {
deepGet(spec, 'spec.tuningConfig.type');
if (!specType) return spec as IngestionSpec;
- if (!deepGet(spec, 'type')) spec = deepSet(spec, 'type', specType);
- if (!deepGet(spec, 'spec.ioConfig.type')) spec = deepSet(spec, 'spec.ioConfig.type', specType);
- if (!deepGet(spec, 'spec.tuningConfig.type')) {
- spec = deepSet(spec, 'spec.tuningConfig.type', specType);
- }
+ spec = deepSetIfUnset(spec, 'type', specType);
+ spec = deepSetIfUnset(spec, 'spec.ioConfig.type', specType);
+ spec = deepSetIfUnset(spec, 'spec.tuningConfig.type', specType);
return spec as IngestionSpec;
}
@@ -1340,9 +1339,8 @@ export interface PartitionsSpec {
assumeGrouped?: boolean;
}
-export function adjustTuningConfig(spec: IngestionSpec) {
- const tuningConfigType = deepGet(spec, 'spec.tuningConfig.type');
- if (tuningConfigType !== 'index_parallel') return spec;
+export function adjustForceGuaranteedRollup(spec: IngestionSpec) {
+ if (getSpecType(spec) !== 'index_parallel') return spec;
const partitionsSpecType = deepGet(spec, 'spec.tuningConfig.partitionsSpec.type') || 'dynamic';
if (partitionsSpecType === 'dynamic') {
@@ -1354,37 +1352,38 @@ export function adjustTuningConfig(spec: IngestionSpec) {
return spec;
}
-export function invalidTuningConfig(tuningConfig: TuningConfig): boolean {
- if (tuningConfig.type !== 'index_parallel') return false;
-
- switch (deepGet(tuningConfig, 'partitionsSpec.type')) {
- case 'hashed':
- return (
- Boolean(deepGet(tuningConfig, 'partitionsSpec.targetRowsPerSegment')) &&
- Boolean(deepGet(tuningConfig, 'partitionsSpec.numShards'))
- );
-
- case 'single_dim':
- if (!deepGet(tuningConfig, 'partitionsSpec.partitionDimension')) return true;
- const hasTargetRowsPerSegment = Boolean(
- deepGet(tuningConfig, 'partitionsSpec.targetRowsPerSegment'),
- );
- const hasMaxRowsPerSegment = Boolean(
- deepGet(tuningConfig, 'partitionsSpec.maxRowsPerSegment'),
- );
- if (hasTargetRowsPerSegment === hasMaxRowsPerSegment) {
- return true;
- }
- }
-
- return false;
+export function invalidPartitionConfig(spec: IngestionSpec): boolean {
+ return (
+ // Bad primary partitioning, or...
+ !deepGet(spec, 'spec.dataSchema.granularitySpec.segmentGranularity') ||
+ // Bad secondary partitioning
+ Boolean(AutoForm.issueWithModel(spec, getSecondaryPartitionRelatedFormFields(spec, undefined)))
+ );
}
-export function getPartitionRelatedTuningSpecFormFields(
+export const PRIMARY_PARTITION_RELATED_FORM_FIELDS: Field[] = [
+ {
+ name: 'spec.dataSchema.granularitySpec.segmentGranularity',
+ type: 'string',
+ suggestions: ['hour', 'day', 'week', 'month', 'year'],
+ defined: s => deepGet(s, 'spec.dataSchema.granularitySpec.type') === 'uniform',
+ required: true,
+ info: (
+ <>
+ The granularity to create time chunks at. Multiple segments can be created per time chunk.
+ For example, with 'DAY' segmentGranularity, the events of the same day fall into the same
+ time chunk which can be optionally further partitioned into multiple segments based on other
+ configurations and input size.
+ >
+ ),
+ },
+];
+
+export function getSecondaryPartitionRelatedFormFields(
spec: IngestionSpec,
dimensionSuggestions: string[] | undefined,
): Field[] {
- const specType = getSpecType(spec) || 'index_parallel';
+ const specType = getSpecType(spec);
switch (specType) {
case 'index_parallel':
const parallelFields: Field[] = [
@@ -1402,7 +1401,14 @@ export function getPartitionRelatedTuningSpecFormFields(
),
adjustment: s => {
- if (!Array.isArray(dimensionSuggestions) || !dimensionSuggestions.length) return s;
+ if (
+ deepGet(s, 'spec.tuningConfig.partitionsSpec.type') !== 'single_dim' ||
+ !Array.isArray(dimensionSuggestions) ||
+ !dimensionSuggestions.length
+ ) {
+ return s;
+ }
+
return deepSet(
s,
'spec.tuningConfig.partitionsSpec.partitionDimension',
@@ -2172,6 +2178,16 @@ export function updateSchemaWithSample(
newSpec = deepDelete(newSpec, 'spec.dataSchema.metricsSpec');
}
+ if (getSpecType(newSpec) === 'index_parallel') {
+ newSpec = adjustForceGuaranteedRollup(
+ deepSet(
+ newSpec,
+ 'spec.tuningConfig.partitionsSpec',
+ rollup ? { type: 'hashed' } : { type: 'dynamic' },
+ ),
+ );
+ }
+
newSpec = deepSet(newSpec, 'spec.dataSchema.granularitySpec.rollup', rollup);
return newSpec;
}
diff --git a/web-console/src/utils/object-change.ts b/web-console/src/utils/object-change.ts
index 7ff7d5e2fc8f..99e3166f9ca8 100644
--- a/web-console/src/utils/object-change.ts
+++ b/web-console/src/utils/object-change.ts
@@ -83,6 +83,11 @@ export function deepSet>(value: T, path: string, x
return valueCopy;
}
+export function deepSetIfUnset>(value: T, path: string, x: any): T {
+ if (typeof deepGet(value, path) !== 'undefined') return value;
+ return deepSet(value, path, x);
+}
+
export function deepSetMulti>(
value: T,
changes: Record,
diff --git a/web-console/src/views/load-data-view/load-data-view.tsx b/web-console/src/views/load-data-view/load-data-view.tsx
index 31bb54ca4970..15e7df035fce 100644
--- a/web-console/src/views/load-data-view/load-data-view.tsx
+++ b/web-console/src/views/load-data-view/load-data-view.tsx
@@ -68,6 +68,7 @@ import {
INPUT_FORMAT_FIELDS,
issueWithSampleData,
METRIC_SPEC_FIELDS,
+ PRIMARY_PARTITION_RELATED_FORM_FIELDS,
removeTimestampTransform,
TIMESTAMP_SPEC_FIELDS,
TimestampSpec,
@@ -76,7 +77,7 @@ import {
updateSchemaWithSample,
} from '../../druid-models';
import {
- adjustTuningConfig,
+ adjustForceGuaranteedRollup,
cleanSpec,
computeFlattenPathsForData,
DimensionMode,
@@ -91,18 +92,17 @@ import {
getIngestionTitle,
getIoConfigFormFields,
getIoConfigTuningFormFields,
- getPartitionRelatedTuningSpecFormFields,
getRequiredModule,
getRollup,
+ getSecondaryPartitionRelatedFormFields,
getSpecType,
getTuningSpecFormFields,
- GranularitySpec,
IngestionComboTypeWithExtra,
IngestionSpec,
InputFormat,
inputFormatCanFlatten,
invalidIoConfig,
- invalidTuningConfig,
+ invalidPartitionConfig,
IoConfig,
isDruidSource,
isEmptyIngestionSpec,
@@ -125,6 +125,7 @@ import {
deepDelete,
deepGet,
deepSet,
+ deepSetIfUnset,
deepSetMulti,
EMPTY_ARRAY,
EMPTY_OBJECT,
@@ -509,9 +510,9 @@ export class LoadDataView extends React.PureComponent {
- this.setState(({ specPreview }) => {
+ this.setState(({ spec, specPreview }) => {
localStorageSet(LocalStorageKeys.INGESTION_SPEC, JSON.stringify(specPreview));
- return { spec: specPreview };
+ return { spec: spec === specPreview ? Object.assign({}, specPreview) : specPreview }; // If applying again, make a shallow copy to force a refresh
});
};
@@ -1886,17 +1887,16 @@ export class LoadDataView extends React.PureComponent
{this.renderNextBar({
disabled: !schemaQueryState.data,
- onNextStep: () => {
- let newSpec = spec;
- if (rollup) {
- newSpec = deepSet(newSpec, 'spec.tuningConfig.partitionsSpec', { type: 'hashed' });
- newSpec = deepSet(newSpec, 'spec.tuningConfig.forceGuaranteedRollup', true);
- } else {
- newSpec = deepSet(newSpec, 'spec.tuningConfig.partitionsSpec', { type: 'dynamic' });
- newSpec = deepDelete(newSpec, 'spec.tuningConfig.forceGuaranteedRollup');
- }
-
- this.updateSpec(newSpec);
- return true;
- },
})}
>
);
@@ -2920,8 +2907,6 @@ export class LoadDataView extends React.PureComponent
Primary partitioning (by time)
g.type === 'uniform',
- required: true,
- info: (
- <>
- The granularity to create time chunks at. Multiple segments can be created per
- time chunk. For example, with 'DAY' segmentGranularity, the events of the same
- day fall into the same time chunk which can be optionally further partitioned
- into multiple segments based on other configurations and input size.
- >
- ),
- },
- ]}
- model={granularitySpec}
- onChange={g => this.updateSpec(deepSet(spec, 'spec.dataSchema.granularitySpec', g))}
+ fields={PRIMARY_PARTITION_RELATED_FORM_FIELDS}
+ model={spec}
+ onChange={this.updateSpec}
/>
- A comma separated list of intervals for the raw data being ingested.>,
- },
- ]}
- model={spec}
- onChange={this.updateSpec}
- />
-
- this.setState({ newFilterValue: f })}
- height="200px"
- />
-
-
A comma separated list of intervals for the raw data being ingested.
-
- This list is used to determine the shards that will be created. If it is not
- specified then then an additional job will run to automatically determine the data
- intervals used.
-
- Druid requires flat data (non-nested, non-hierarchical). Each row should represent a
- discrete event.
-
- {canFlatten && (
+
+
- If you have nested data, you can{' '}
-
- flatten
- {' '}
- it here. If the provided flattening capabilities are not sufficient, please pre-process
- your data before ingesting it into Druid.
+ Druid requires flat data (non-nested, non-hierarchical). Each row should represent a
+ discrete event.
- )}
-
Ensure that your data appears correctly in a row/column orientation.
-
-
+ {canFlatten && (
+
+ If you have nested data, you can{' '}
+
+ flatten
+ {' '}
+ it here. If the provided flattening capabilities are not sufficient, please pre-process
+ your data before ingesting it into Druid.
+
+ )}
+
Ensure that your data appears correctly in a row/column orientation.
- Druid partitions data based on the primary time column of your data. This column is stored
- internally in Druid as __time.
-
-
Configure how to define the time column for this data.
-
- If your data does not have a time column, you can select None to use a
- placeholder value. If the time information is spread across multiple columns you can combine
- them into one by selecting Expression and defining a transform expression.
-
-
-
+
+
+
+ Druid partitions data based on the primary time column of your data. This column is stored
+ internally in Druid as __time.
+
+
Configure how to define the time column for this data.
+
+ If your data does not have a time column, you can select None to use a
+ placeholder value. If the time information is spread across multiple columns you can
+ combine them into one by selecting Expression and defining a transform
+ expression.
+
- Each column in Druid must have an assigned type (string, long, float, double, complex, etc).
-
- {dimensionMode === 'specific' && (
+
+
- Default primitive types have been automatically assigned to your columns. If you want to
- change the type, click on the column header.
+ Each column in Druid must have an assigned type (string, long, float, double, complex,
+ etc).
- )}
-
-
+ {dimensionMode === 'specific' && (
+
+ Default primitive types have been automatically assigned to your columns. If you want to
+ change the type, click on the column header.
+
- Druid begins ingesting data once you submit a JSON ingestion spec. If you modify any values
- in this view, the values entered in previous sections will update accordingly. If you modify
- any values in previous sections, this spec will automatically update.
-
-
Submit the spec to begin loading data into Druid.
-
-
+
+
+
+ Druid begins ingesting data once you submit a JSON ingestion spec. If you modify any
+ values in this view, the values entered in previous sections will update accordingly. If
+ you modify any values in previous sections, this spec will automatically update.
+
Your partitioning and sorting configuration does not make sense.
-
- For best performance the first dimension in your schema (
- {firstDimensionName}), which is what the data will be primarily sorted on,
- should match the partitioning dimension ({partitionDimension}).
-
Your partitioning and sorting configuration does not make sense.
+
+ For best performance the first dimension in your schema (
+ {firstDimensionName}), which is what the data will be primarily sorted
+ on, should match the partitioning dimension ({partitionDimension}).
+
+
+
);
}
@@ -2923,6 +2930,15 @@ export class LoadDataView extends React.PureComponent
{nonsensicalSingleDimPartitioningMessage}
+ {settingIntervalsWouldSpeedUpIngestion(spec) && (
+
+
+ You can make this ingestion run slightly faster by explicitly specifying the time
+ intervals for this dataset from the{' '}
+ this.updateStep('filter')}>Filter step.
+
+
+ )}
Assume that input data has already been grouped on time and dimensions. Ingestion will run faster, but may choose sub-optimal partitions if this assumption is violated.
+ Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
+
,
+ "name": "inputSegmentSizeBytes",
+ "type": "number",
+ },
Object {
"defaultValue": 1,
"info":
Maximum number of tasks which can be run at the same time. The supervisor task would spawn worker tasks up to maxNumConcurrentSubTasks regardless of the available task slots. If this value is set to 1, the supervisor task processes data ingestion on its own instead of spawning worker tasks. If this value is set to too large, too many worker tasks can be created which might block other ingestion.
,
- "label": "Max num concurrent sub tasks",
"min": 1,
"name": "tuningConfig.maxNumConcurrentSubTasks",
"type": "number",
},
- Object {
- "defaultValue": 419430400,
- "info":
- Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
-
,
- "name": "inputSegmentSizeBytes",
- "type": "number",
- },
Object {
"defaultValue": 10,
"defined": [Function],
"info":
Maximum number of merge tasks which can be run at the same time.
,
- "label": "Total num merge tasks",
"min": 1,
"name": "tuningConfig.totalNumMergeTasks",
"type": "number",
},
Object {
"adjustment": [Function],
- "defaultValue": 500000000,
+ "defaultValue": 1073741824,
+ "hideInMore": true,
"info":
Maximum number of bytes of input segments to process in a single task. If a single segment is larger than this number, it will be processed by itself in a single task (input segments are never split across tasks).
,
- "label": "Max input segment bytes per task",
"min": 1000000,
- "name": "tuningConfig.splitHintSpec.maxInputSegmentBytesPerTask",
+ "name": "tuningConfig.splitHintSpec.maxSplitSize",
+ "type": "number",
+ },
+ Object {
+ "adjustment": [Function],
+ "defaultValue": 1000,
+ "hideInMore": true,
+ "info":
+ Maximum number of input segments to process in a single subtask. This limit is to avoid task failures when the ingestion spec is too long. There are two known limits on the max size of serialized ingestion spec, i.e., the max ZNode size in ZooKeeper (
+
+ jute.maxbuffer
+
+ ) and the max packet size in MySQL (
+
+ max_allowed_packet
+
+ ). These can make ingestion tasks fail if the serialized ingestion spec size hits one of them.
+ ,
+ "label": "Max num files (segments)",
+ "min": 1,
+ "name": "tuningConfig.splitHintSpec.maxNumFiles",
"type": "number",
},
]
@@ -303,7 +312,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
"info":
Determines how many rows are in each segment.
,
- "label": "Max rows per segment",
"name": "tuningConfig.partitionsSpec.maxRowsPerSegment",
"type": "number",
},
@@ -313,7 +321,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
"info":
Total number of rows in segments waiting for being pushed.
,
- "label": "Max total rows",
"name": "tuningConfig.partitionsSpec.maxTotalRows",
"type": "number",
},
@@ -327,7 +334,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
A target row count for each partition. Each partition will have a row count close to the target assuming evenly distributed keys. Defaults to 5 million if numShards is null.
,
- "label": "Target rows per segment",
"name": "tuningConfig.partitionsSpec.targetRowsPerSegment",
"type": "number",
"zeroMeansUndefined": true,
@@ -342,7 +348,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
Directly specify the number of shards to create. If this is specified and 'intervals' is specified in the granularitySpec, the index task can skip the determine intervals/partitions pass through the data.
,
- "label": "Num shards",
"name": "tuningConfig.partitionsSpec.numShards",
"type": "number",
"zeroMeansUndefined": true,
@@ -352,7 +357,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
"info":
The dimensions to partition on. Leave blank to select all dimensions.
Target number of rows to include in a partition, should be a number that targets segments of 500MB~1GB.
,
- "label": "Target rows per segment",
"name": "tuningConfig.partitionsSpec.targetRowsPerSegment",
"required": [Function],
"type": "number",
@@ -383,7 +385,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
"info":
Maximum number of rows to include in a partition.
,
- "label": "Max rows per segment",
"name": "tuningConfig.partitionsSpec.maxRowsPerSegment",
"required": [Function],
"type": "number",
@@ -395,48 +396,65 @@ exports[`CompactionDialog matches snapshot with compactionConfig (hashed partiti
"info":
Assume that input data has already been grouped on time and dimensions. Ingestion will run faster, but may choose sub-optimal partitions if this assumption is violated.
+ Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
+
,
+ "name": "inputSegmentSizeBytes",
+ "type": "number",
+ },
Object {
"defaultValue": 1,
"info":
Maximum number of tasks which can be run at the same time. The supervisor task would spawn worker tasks up to maxNumConcurrentSubTasks regardless of the available task slots. If this value is set to 1, the supervisor task processes data ingestion on its own instead of spawning worker tasks. If this value is set to too large, too many worker tasks can be created which might block other ingestion.
,
- "label": "Max num concurrent sub tasks",
"min": 1,
"name": "tuningConfig.maxNumConcurrentSubTasks",
"type": "number",
},
- Object {
- "defaultValue": 419430400,
- "info":
- Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
-
,
- "name": "inputSegmentSizeBytes",
- "type": "number",
- },
Object {
"defaultValue": 10,
"defined": [Function],
"info":
Maximum number of merge tasks which can be run at the same time.
,
- "label": "Total num merge tasks",
"min": 1,
"name": "tuningConfig.totalNumMergeTasks",
"type": "number",
},
Object {
"adjustment": [Function],
- "defaultValue": 500000000,
+ "defaultValue": 1073741824,
+ "hideInMore": true,
"info":
Maximum number of bytes of input segments to process in a single task. If a single segment is larger than this number, it will be processed by itself in a single task (input segments are never split across tasks).
,
- "label": "Max input segment bytes per task",
"min": 1000000,
- "name": "tuningConfig.splitHintSpec.maxInputSegmentBytesPerTask",
+ "name": "tuningConfig.splitHintSpec.maxSplitSize",
+ "type": "number",
+ },
+ Object {
+ "adjustment": [Function],
+ "defaultValue": 1000,
+ "hideInMore": true,
+ "info":
+ Maximum number of input segments to process in a single subtask. This limit is to avoid task failures when the ingestion spec is too long. There are two known limits on the max size of serialized ingestion spec, i.e., the max ZNode size in ZooKeeper (
+
+ jute.maxbuffer
+
+ ) and the max packet size in MySQL (
+
+ max_allowed_packet
+
+ ). These can make ingestion tasks fail if the serialized ingestion spec size hits one of them.
+ ,
+ "label": "Max num files (segments)",
+ "min": 1,
+ "name": "tuningConfig.splitHintSpec.maxNumFiles",
"type": "number",
},
]
@@ -543,7 +561,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
"info":
Determines how many rows are in each segment.
,
- "label": "Max rows per segment",
"name": "tuningConfig.partitionsSpec.maxRowsPerSegment",
"type": "number",
},
@@ -553,7 +570,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
"info":
Total number of rows in segments waiting for being pushed.
,
- "label": "Max total rows",
"name": "tuningConfig.partitionsSpec.maxTotalRows",
"type": "number",
},
@@ -567,7 +583,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
A target row count for each partition. Each partition will have a row count close to the target assuming evenly distributed keys. Defaults to 5 million if numShards is null.
,
- "label": "Target rows per segment",
"name": "tuningConfig.partitionsSpec.targetRowsPerSegment",
"type": "number",
"zeroMeansUndefined": true,
@@ -582,7 +597,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
Directly specify the number of shards to create. If this is specified and 'intervals' is specified in the granularitySpec, the index task can skip the determine intervals/partitions pass through the data.
,
- "label": "Num shards",
"name": "tuningConfig.partitionsSpec.numShards",
"type": "number",
"zeroMeansUndefined": true,
@@ -592,7 +606,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
"info":
The dimensions to partition on. Leave blank to select all dimensions.
Target number of rows to include in a partition, should be a number that targets segments of 500MB~1GB.
,
- "label": "Target rows per segment",
"name": "tuningConfig.partitionsSpec.targetRowsPerSegment",
"required": [Function],
"type": "number",
@@ -623,7 +634,6 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
"info":
Maximum number of rows to include in a partition.
,
- "label": "Max rows per segment",
"name": "tuningConfig.partitionsSpec.maxRowsPerSegment",
"required": [Function],
"type": "number",
@@ -635,48 +645,65 @@ exports[`CompactionDialog matches snapshot with compactionConfig (single_dim par
"info":
Assume that input data has already been grouped on time and dimensions. Ingestion will run faster, but may choose sub-optimal partitions if this assumption is violated.
+ Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
+
,
+ "name": "inputSegmentSizeBytes",
+ "type": "number",
+ },
Object {
"defaultValue": 1,
"info":
Maximum number of tasks which can be run at the same time. The supervisor task would spawn worker tasks up to maxNumConcurrentSubTasks regardless of the available task slots. If this value is set to 1, the supervisor task processes data ingestion on its own instead of spawning worker tasks. If this value is set to too large, too many worker tasks can be created which might block other ingestion.
,
- "label": "Max num concurrent sub tasks",
"min": 1,
"name": "tuningConfig.maxNumConcurrentSubTasks",
"type": "number",
},
- Object {
- "defaultValue": 419430400,
- "info":
- Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
-
,
- "name": "inputSegmentSizeBytes",
- "type": "number",
- },
Object {
"defaultValue": 10,
"defined": [Function],
"info":
Maximum number of merge tasks which can be run at the same time.
,
- "label": "Total num merge tasks",
"min": 1,
"name": "tuningConfig.totalNumMergeTasks",
"type": "number",
},
Object {
"adjustment": [Function],
- "defaultValue": 500000000,
+ "defaultValue": 1073741824,
+ "hideInMore": true,
"info":
Maximum number of bytes of input segments to process in a single task. If a single segment is larger than this number, it will be processed by itself in a single task (input segments are never split across tasks).
,
- "label": "Max input segment bytes per task",
"min": 1000000,
- "name": "tuningConfig.splitHintSpec.maxInputSegmentBytesPerTask",
+ "name": "tuningConfig.splitHintSpec.maxSplitSize",
+ "type": "number",
+ },
+ Object {
+ "adjustment": [Function],
+ "defaultValue": 1000,
+ "hideInMore": true,
+ "info":
+ Maximum number of input segments to process in a single subtask. This limit is to avoid task failures when the ingestion spec is too long. There are two known limits on the max size of serialized ingestion spec, i.e., the max ZNode size in ZooKeeper (
+
+ jute.maxbuffer
+
+ ) and the max packet size in MySQL (
+
+ max_allowed_packet
+
+ ). These can make ingestion tasks fail if the serialized ingestion spec size hits one of them.
+ ,
+ "label": "Max num files (segments)",
+ "min": 1,
+ "name": "tuningConfig.splitHintSpec.maxNumFiles",
"type": "number",
},
]
@@ -783,7 +810,6 @@ exports[`CompactionDialog matches snapshot without compactionConfig 1`] = `
"info":
Determines how many rows are in each segment.
,
- "label": "Max rows per segment",
"name": "tuningConfig.partitionsSpec.maxRowsPerSegment",
"type": "number",
},
@@ -793,7 +819,6 @@ exports[`CompactionDialog matches snapshot without compactionConfig 1`] = `
"info":
Total number of rows in segments waiting for being pushed.
,
- "label": "Max total rows",
"name": "tuningConfig.partitionsSpec.maxTotalRows",
"type": "number",
},
@@ -807,7 +832,6 @@ exports[`CompactionDialog matches snapshot without compactionConfig 1`] = `
A target row count for each partition. Each partition will have a row count close to the target assuming evenly distributed keys. Defaults to 5 million if numShards is null.
,
- "label": "Target rows per segment",
"name": "tuningConfig.partitionsSpec.targetRowsPerSegment",
"type": "number",
"zeroMeansUndefined": true,
@@ -822,7 +846,6 @@ exports[`CompactionDialog matches snapshot without compactionConfig 1`] = `
Directly specify the number of shards to create. If this is specified and 'intervals' is specified in the granularitySpec, the index task can skip the determine intervals/partitions pass through the data.
,
- "label": "Num shards",
"name": "tuningConfig.partitionsSpec.numShards",
"type": "number",
"zeroMeansUndefined": true,
@@ -832,7 +855,6 @@ exports[`CompactionDialog matches snapshot without compactionConfig 1`] = `
"info":
The dimensions to partition on. Leave blank to select all dimensions.
Assume that input data has already been grouped on time and dimensions. Ingestion will run faster, but may choose sub-optimal partitions if this assumption is violated.
+ Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
+
,
+ "name": "inputSegmentSizeBytes",
+ "type": "number",
+ },
Object {
"defaultValue": 1,
"info":
Maximum number of tasks which can be run at the same time. The supervisor task would spawn worker tasks up to maxNumConcurrentSubTasks regardless of the available task slots. If this value is set to 1, the supervisor task processes data ingestion on its own instead of spawning worker tasks. If this value is set to too large, too many worker tasks can be created which might block other ingestion.
,
- "label": "Max num concurrent sub tasks",
"min": 1,
"name": "tuningConfig.maxNumConcurrentSubTasks",
"type": "number",
},
- Object {
- "defaultValue": 419430400,
- "info":
- Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk. Because each compaction task runs with a single thread, setting this value too far above 1–2GB will result in compaction tasks taking an excessive amount of time.
-
,
- "name": "inputSegmentSizeBytes",
- "type": "number",
- },
Object {
"defaultValue": 10,
"defined": [Function],
"info":
Maximum number of merge tasks which can be run at the same time.
,
- "label": "Total num merge tasks",
"min": 1,
"name": "tuningConfig.totalNumMergeTasks",
"type": "number",
},
Object {
"adjustment": [Function],
- "defaultValue": 500000000,
+ "defaultValue": 1073741824,
+ "hideInMore": true,
"info":
Maximum number of bytes of input segments to process in a single task. If a single segment is larger than this number, it will be processed by itself in a single task (input segments are never split across tasks).
,
- "label": "Max input segment bytes per task",
"min": 1000000,
- "name": "tuningConfig.splitHintSpec.maxInputSegmentBytesPerTask",
+ "name": "tuningConfig.splitHintSpec.maxSplitSize",
+ "type": "number",
+ },
+ Object {
+ "adjustment": [Function],
+ "defaultValue": 1000,
+ "hideInMore": true,
+ "info":
+ Maximum number of input segments to process in a single subtask. This limit is to avoid task failures when the ingestion spec is too long. There are two known limits on the max size of serialized ingestion spec, i.e., the max ZNode size in ZooKeeper (
+
+ jute.maxbuffer
+
+ ) and the max packet size in MySQL (
+
+ max_allowed_packet
+
+ ). These can make ingestion tasks fail if the serialized ingestion spec size hits one of them.
+ ,
+ "label": "Max num files (segments)",
+ "min": 1,
+ "name": "tuningConfig.splitHintSpec.maxNumFiles",
"type": "number",
},
]
diff --git a/web-console/src/dialogs/lookup-edit-dialog/__snapshots__/lookup-edit-dialog.spec.tsx.snap b/web-console/src/dialogs/lookup-edit-dialog/__snapshots__/lookup-edit-dialog.spec.tsx.snap
index 7b7dabc71a8b..e5056501c0cd 100644
--- a/web-console/src/dialogs/lookup-edit-dialog/__snapshots__/lookup-edit-dialog.spec.tsx.snap
+++ b/web-console/src/dialogs/lookup-edit-dialog/__snapshots__/lookup-edit-dialog.spec.tsx.snap
@@ -158,7 +158,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
"defaultValue": 0,
"defined": [Function],
"info": "Number of header rows to be skipped. The default number of header rows to be skipped is 0.",
- "label": "Skip header rows",
"name": "extractionNamespace.namespaceParseSpec.skipHeaderRows",
"type": "number",
},
@@ -166,14 +165,12 @@ exports[`LookupEditDialog matches snapshot 1`] = `
"defaultValue": false,
"defined": [Function],
"info": "A flag to indicate that column information can be extracted from the input files' header row",
- "label": "Has header row",
"name": "extractionNamespace.namespaceParseSpec.hasHeaderRow",
"type": "boolean",
},
Object {
"defined": [Function],
"info": "The list of columns in the csv file",
- "label": "Columns",
"name": "extractionNamespace.namespaceParseSpec.columns",
"placeholder": "[\\"key\\", \\"value\\"]",
"required": [Function],
@@ -182,7 +179,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
Object {
"defined": [Function],
"info": "The name of the column containing the key",
- "label": "Key column",
"name": "extractionNamespace.namespaceParseSpec.keyColumn",
"placeholder": "(optional - defaults to the first column)",
"type": "string",
@@ -190,28 +186,24 @@ exports[`LookupEditDialog matches snapshot 1`] = `
Object {
"defined": [Function],
"info": "The name of the column containing the value",
- "label": "Value column",
"name": "extractionNamespace.namespaceParseSpec.valueColumn",
"placeholder": "(optional - defaults to the second column)",
"type": "string",
},
Object {
"defined": [Function],
- "label": "Delimiter",
"name": "extractionNamespace.namespaceParseSpec.delimiter",
"placeholder": "(optional)",
"type": "string",
},
Object {
"defined": [Function],
- "label": "List delimiter",
"name": "extractionNamespace.namespaceParseSpec.listDelimiter",
"placeholder": "(optional)",
"type": "string",
},
Object {
"defined": [Function],
- "label": "Key field name",
"name": "extractionNamespace.namespaceParseSpec.keyFieldName",
"placeholder": "key",
"required": true,
@@ -219,7 +211,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
},
Object {
"defined": [Function],
- "label": "Value field name",
"name": "extractionNamespace.namespaceParseSpec.valueFieldName",
"placeholder": "value",
"required": true,
@@ -229,7 +220,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
"defaultValue": "0",
"defined": [Function],
"info": "Period between polling for updates",
- "label": "Poll period",
"name": "extractionNamespace.pollPeriod",
"type": "string",
},
@@ -247,7 +237,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
.table WHERE filter
,
- "label": "Namespace",
"name": "extractionNamespace.namespace",
"placeholder": "some_lookup",
"required": true,
@@ -264,21 +253,18 @@ exports[`LookupEditDialog matches snapshot 1`] = `
Object {
"defined": [Function],
"info": "Defines the user to be used by the connector config",
- "label": "User",
"name": "extractionNamespace.connectorConfig.user",
"type": "string",
},
Object {
"defined": [Function],
"info": "Defines the password to be used by the connector config",
- "label": "Password",
"name": "extractionNamespace.connectorConfig.password",
"type": "string",
},
Object {
"defined": [Function],
"info": "Should tables be created",
- "label": "Create tables",
"name": "extractionNamespace.connectorConfig.createTables",
"type": "boolean",
},
@@ -296,7 +282,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
WHERE filter
,
- "label": "Table",
"name": "extractionNamespace.table",
"placeholder": "some_lookup_table",
"required": true,
@@ -316,7 +301,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
, valueColumn, tsColumn? FROM namespace.table WHERE filter
,
- "label": "Key column",
"name": "extractionNamespace.keyColumn",
"placeholder": "my_key_value",
"required": true,
@@ -336,7 +320,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
, tsColumn? FROM namespace.table WHERE filter
,
- "label": "Value column",
"name": "extractionNamespace.valueColumn",
"placeholder": "my_column_value",
"required": true,
@@ -356,7 +339,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
,
- "label": "Filter",
"name": "extractionNamespace.filter",
"placeholder": "(optional)",
"type": "string",
@@ -384,7 +366,6 @@ exports[`LookupEditDialog matches snapshot 1`] = `
"defaultValue": 0,
"defined": [Function],
"info": "How long to wait (in ms) for the first run of the cache to populate. 0 indicates to not wait",
- "label": "First cache timeout",
"name": "firstCacheTimeout",
"type": "number",
},
diff --git a/web-console/src/druid-models/compaction-config.tsx b/web-console/src/druid-models/compaction-config.tsx
index 02bb42f0004e..437f91404802 100644
--- a/web-console/src/druid-models/compaction-config.tsx
+++ b/web-console/src/druid-models/compaction-config.tsx
@@ -53,7 +53,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
// partitionsSpec type: dynamic
{
name: 'tuningConfig.partitionsSpec.maxRowsPerSegment',
- label: 'Max rows per segment',
type: 'number',
defaultValue: 5000000,
defined: (t: CompactionConfig) => deepGet(t, 'tuningConfig.partitionsSpec.type') === 'dynamic',
@@ -61,7 +60,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
},
{
name: 'tuningConfig.partitionsSpec.maxTotalRows',
- label: 'Max total rows',
type: 'number',
defaultValue: 20000000,
defined: (t: CompactionConfig) => deepGet(t, 'tuningConfig.partitionsSpec.type') === 'dynamic',
@@ -70,7 +68,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
// partitionsSpec type: hashed
{
name: 'tuningConfig.partitionsSpec.targetRowsPerSegment',
- label: 'Target rows per segment',
type: 'number',
zeroMeansUndefined: true,
defined: (t: CompactionConfig) =>
@@ -91,7 +88,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
},
{
name: 'tuningConfig.partitionsSpec.numShards',
- label: 'Num shards',
type: 'number',
zeroMeansUndefined: true,
defined: (t: CompactionConfig) =>
@@ -113,7 +109,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
},
{
name: 'tuningConfig.partitionsSpec.partitionDimensions',
- label: 'Partition dimensions',
type: 'string-array',
placeholder: '(all dimensions)',
defined: (t: CompactionConfig) => deepGet(t, 'tuningConfig.partitionsSpec.type') === 'hashed',
@@ -122,7 +117,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
// partitionsSpec type: single_dim
{
name: 'tuningConfig.partitionsSpec.partitionDimension',
- label: 'Partition dimension',
type: 'string',
defined: (t: CompactionConfig) =>
deepGet(t, 'tuningConfig.partitionsSpec.type') === 'single_dim',
@@ -131,7 +125,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
},
{
name: 'tuningConfig.partitionsSpec.targetRowsPerSegment',
- label: 'Target rows per segment',
type: 'number',
zeroMeansUndefined: true,
defined: (t: CompactionConfig) =>
@@ -149,7 +142,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
},
{
name: 'tuningConfig.partitionsSpec.maxRowsPerSegment',
- label: 'Max rows per segment',
type: 'number',
zeroMeansUndefined: true,
defined: (t: CompactionConfig) =>
@@ -162,7 +154,6 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
},
{
name: 'tuningConfig.partitionsSpec.assumeGrouped',
- label: 'Assume grouped',
type: 'boolean',
defaultValue: false,
defined: (t: CompactionConfig) =>
@@ -174,9 +165,22 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
),
},
+ {
+ name: 'inputSegmentSizeBytes',
+ type: 'number',
+ defaultValue: 419430400,
+ info: (
+
+ Maximum number of total segment bytes processed per compaction task. Since a time chunk must
+ be processed in its entirety, if the segments for a particular time chunk have a total size
+ in bytes greater than this parameter, compaction will not run for that time chunk. Because
+ each compaction task runs with a single thread, setting this value too far above 1–2GB will
+ result in compaction tasks taking an excessive amount of time.
+
- Maximum number of total segment bytes processed per compaction task. Since a time chunk must
- be processed in its entirety, if the segments for a particular time chunk have a total size
- in bytes greater than this parameter, compaction will not run for that time chunk. Because
- each compaction task runs with a single thread, setting this value too far above 1–2GB will
- result in compaction tasks taking an excessive amount of time.
-
- ),
- },
{
name: 'tuningConfig.totalNumMergeTasks',
- label: 'Total num merge tasks',
type: 'number',
defaultValue: 10,
min: 1,
@@ -215,12 +204,12 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
info: <>Maximum number of merge tasks which can be run at the same time.>,
},
{
- name: 'tuningConfig.splitHintSpec.maxInputSegmentBytesPerTask',
- label: 'Max input segment bytes per task',
+ name: 'tuningConfig.splitHintSpec.maxSplitSize',
type: 'number',
- defaultValue: 500000000,
+ defaultValue: 1073741824,
min: 1000000,
- adjustment: (t: CompactionConfig) => deepSet(t, 'tuningConfig.splitHintSpec.type', 'segments'),
+ hideInMore: true,
+ adjustment: (t: CompactionConfig) => deepSet(t, 'tuningConfig.splitHintSpec.type', 'maxSize'),
info: (
<>
Maximum number of bytes of input segments to process in a single task. If a single segment
@@ -229,4 +218,23 @@ export const COMPACTION_CONFIG_FIELDS: Field[] = [
>
),
},
+ {
+ name: 'tuningConfig.splitHintSpec.maxNumFiles',
+ label: 'Max num files (segments)',
+ type: 'number',
+ defaultValue: 1000,
+ min: 1,
+ hideInMore: true,
+ adjustment: (t: CompactionConfig) => deepSet(t, 'tuningConfig.splitHintSpec.type', 'maxSize'),
+ info: (
+ <>
+ Maximum number of input segments to process in a single subtask. This limit is to avoid task
+ failures when the ingestion spec is too long. There are two known limits on the max size of
+ serialized ingestion spec, i.e., the max ZNode size in ZooKeeper (
+ jute.maxbuffer) and the max packet size in MySQL (
+ max_allowed_packet). These can make ingestion tasks fail if the serialized
+ ingestion spec size hits one of them.
+ >
+ ),
+ },
];
diff --git a/web-console/src/druid-models/filter.tsx b/web-console/src/druid-models/filter.tsx
index 882fdd8d6757..2951dbd1905c 100644
--- a/web-console/src/druid-models/filter.tsx
+++ b/web-console/src/druid-models/filter.tsx
@@ -154,7 +154,6 @@ export const FILTERS_FIELDS: Field[] = [
},
{
name: 'spec.dataSchema.transformSpec.filter',
- label: 'Filter',
type: 'json',
height: '350px',
placeholder: '{ "type": "true" }',
diff --git a/web-console/src/druid-models/ingestion-spec.tsx b/web-console/src/druid-models/ingestion-spec.tsx
index a1783fb13115..eb5b582aee23 100644
--- a/web-console/src/druid-models/ingestion-spec.tsx
+++ b/web-console/src/druid-models/ingestion-spec.tsx
@@ -1420,7 +1420,6 @@ export function getSecondaryPartitionRelatedFormFields(
// partitionsSpec type: dynamic
{
name: 'spec.tuningConfig.partitionsSpec.maxRowsPerSegment',
- label: 'Max rows per segment',
type: 'number',
defaultValue: 5000000,
defined: s => deepGet(s, 'spec.tuningConfig.partitionsSpec.type') === 'dynamic',
@@ -1428,7 +1427,6 @@ export function getSecondaryPartitionRelatedFormFields(
},
{
name: 'spec.tuningConfig.partitionsSpec.maxTotalRows',
- label: 'Max total rows',
type: 'number',
defaultValue: 20000000,
defined: s => deepGet(s, 'spec.tuningConfig.partitionsSpec.type') === 'dynamic',
@@ -1437,7 +1435,6 @@ export function getSecondaryPartitionRelatedFormFields(
// partitionsSpec type: hashed
{
name: 'spec.tuningConfig.partitionsSpec.targetRowsPerSegment',
- label: 'Target rows per segment',
type: 'number',
zeroMeansUndefined: true,
defaultValue: 5000000,
@@ -1460,7 +1457,6 @@ export function getSecondaryPartitionRelatedFormFields(
},
{
name: 'spec.tuningConfig.partitionsSpec.numShards',
- label: 'Num shards',
type: 'number',
zeroMeansUndefined: true,
hideInMore: true,
@@ -1483,7 +1479,6 @@ export function getSecondaryPartitionRelatedFormFields(
},
{
name: 'spec.tuningConfig.partitionsSpec.partitionDimensions',
- label: 'Partition dimensions',
type: 'string-array',
placeholder: '(all dimensions)',
defined: s => deepGet(s, 'spec.tuningConfig.partitionsSpec.type') === 'hashed',
@@ -1492,7 +1487,6 @@ export function getSecondaryPartitionRelatedFormFields(
// partitionsSpec type: single_dim
{
name: 'spec.tuningConfig.partitionsSpec.partitionDimension',
- label: 'Partition dimension',
type: 'string',
defined: s => deepGet(s, 'spec.tuningConfig.partitionsSpec.type') === 'single_dim',
required: true,
@@ -1512,7 +1506,6 @@ export function getSecondaryPartitionRelatedFormFields(
},
{
name: 'spec.tuningConfig.partitionsSpec.targetRowsPerSegment',
- label: 'Target rows per segment',
type: 'number',
zeroMeansUndefined: true,
defined: s =>
@@ -1530,7 +1523,6 @@ export function getSecondaryPartitionRelatedFormFields(
},
{
name: 'spec.tuningConfig.partitionsSpec.maxRowsPerSegment',
- label: 'Max rows per segment',
type: 'number',
zeroMeansUndefined: true,
defined: s =>
@@ -1543,7 +1535,6 @@ export function getSecondaryPartitionRelatedFormFields(
},
{
name: 'spec.tuningConfig.partitionsSpec.assumeGrouped',
- label: 'Assume grouped',
type: 'boolean',
defaultValue: false,
hideInMore: true,
@@ -1562,14 +1553,12 @@ export function getSecondaryPartitionRelatedFormFields(
return [
{
name: 'spec.tuningConfig.maxRowsPerSegment',
- label: 'Max rows per segment',
type: 'number',
defaultValue: 5000000,
info: <>Determines how many rows are in each segment.>,
},
{
name: 'spec.tuningConfig.maxTotalRows',
- label: 'Max total rows',
type: 'number',
defaultValue: 20000000,
info: <>Total number of rows in segments waiting for being pushed.>,
@@ -1587,13 +1576,13 @@ export function settingIntervalsWouldSpeedUpIngestion(spec: IngestionSpec): bool
);
}
-const TUNING_CONFIG_FORM_FIELDS: Field[] = [
+const TUNING_FORM_FIELDS: Field[] = [
{
- name: 'maxNumConcurrentSubTasks',
+ name: 'spec.tuningConfig.maxNumConcurrentSubTasks',
type: 'number',
defaultValue: 1,
min: 1,
- defined: (t: TuningConfig) => t.type === 'index_parallel',
+ defined: s => s.type === 'index_parallel',
info: (
<>
Maximum number of tasks which can be run at the same time. The supervisor task would spawn
@@ -1605,41 +1594,41 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'maxRetry',
+ name: 'spec.tuningConfig.maxRetry',
type: 'number',
defaultValue: 3,
- defined: (t: TuningConfig) => t.type === 'index_parallel',
+ defined: s => s.type === 'index_parallel',
hideInMore: true,
info: <>Maximum number of retries on task failures.>,
},
{
- name: 'taskStatusCheckPeriodMs',
+ name: 'spec.tuningConfig.taskStatusCheckPeriodMs',
type: 'number',
defaultValue: 1000,
- defined: (t: TuningConfig) => t.type === 'index_parallel',
+ defined: s => s.type === 'index_parallel',
hideInMore: true,
info: <>Polling period in milliseconds to check running task statuses.>,
},
{
- name: 'totalNumMergeTasks',
+ name: 'spec.tuningConfig.totalNumMergeTasks',
type: 'number',
defaultValue: 10,
min: 1,
- defined: (t: TuningConfig) =>
+ defined: s =>
Boolean(
- t.type === 'index_parallel' &&
- oneOf(deepGet(t, 'partitionsSpec.type'), 'hashed', 'single_dim'),
+ s.type === 'index_parallel' &&
+ oneOf(deepGet(s, 'spec.tuningConfig.partitionsSpec.type'), 'hashed', 'single_dim'),
),
info: <>Number of tasks to merge partial segments after shuffle.>,
},
{
- name: 'maxNumSegmentsToMerge',
+ name: 'spec.tuningConfig.maxNumSegmentsToMerge',
type: 'number',
defaultValue: 100,
- defined: (t: TuningConfig) =>
+ defined: s =>
Boolean(
- t.type === 'index_parallel' &&
- oneOf(deepGet(t, 'partitionsSpec.type'), 'hashed', 'single_dim'),
+ s.type === 'index_parallel' &&
+ oneOf(deepGet(s, 'spec.tuningConfig.partitionsSpec.type'), 'hashed', 'single_dim'),
),
info: (
<>
@@ -1648,22 +1637,22 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'maxRowsInMemory',
+ name: 'spec.tuningConfig.maxRowsInMemory',
type: 'number',
defaultValue: 1000000,
info: <>Used in determining when intermediate persists to disk should occur.>,
},
{
- name: 'maxBytesInMemory',
+ name: 'spec.tuningConfig.maxBytesInMemory',
type: 'number',
placeholder: 'Default: 1/6 of max JVM memory',
info: <>Used in determining when intermediate persists to disk should occur.>,
},
{
- name: 'resetOffsetAutomatically',
+ name: 'spec.tuningConfig.resetOffsetAutomatically',
type: 'boolean',
defaultValue: false,
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
info: (
<>
Whether to reset the consumer offset if the next offset that it is trying to fetch is less
@@ -1672,10 +1661,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'skipSequenceNumberAvailabilityCheck',
+ name: 'spec.tuningConfig.skipSequenceNumberAvailabilityCheck',
type: 'boolean',
defaultValue: false,
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
info: (
<>
Whether to enable checking if the current sequence number is still available in a particular
@@ -1685,17 +1674,17 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'intermediatePersistPeriod',
+ name: 'spec.tuningConfig.intermediatePersistPeriod',
type: 'duration',
defaultValue: 'PT10M',
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
info: <>The period that determines the rate at which intermediate persists occur.>,
},
{
- name: 'intermediateHandoffPeriod',
+ name: 'spec.tuningConfig.intermediateHandoffPeriod',
type: 'duration',
defaultValue: 'P2147483647D',
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
info: (
<>
How often the tasks should hand off segments. Handoff will happen either if
@@ -1705,7 +1694,7 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'maxPendingPersists',
+ name: 'spec.tuningConfig.maxPendingPersists',
type: 'number',
hideInMore: true,
info: (
@@ -1717,7 +1706,7 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'pushTimeout',
+ name: 'spec.tuningConfig.pushTimeout',
type: 'number',
defaultValue: 0,
hideInMore: true,
@@ -1728,15 +1717,15 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'handoffConditionTimeout',
+ name: 'spec.tuningConfig.handoffConditionTimeout',
type: 'number',
defaultValue: 0,
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
hideInMore: true,
info: <>Milliseconds to wait for segment handoff. 0 means to wait forever.>,
},
{
- name: 'indexSpec.bitmap.type',
+ name: 'spec.tuningConfig.indexSpec.bitmap.type',
label: 'Index bitmap type',
type: 'string',
defaultValue: 'roaring',
@@ -1745,7 +1734,7 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
info: <>Compression format for bitmap indexes.>,
},
{
- name: 'indexSpec.dimensionCompression',
+ name: 'spec.tuningConfig.indexSpec.dimensionCompression',
label: 'Index dimension compression',
type: 'string',
defaultValue: 'lz4',
@@ -1754,7 +1743,7 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
info: <>Compression format for dimension columns.>,
},
{
- name: 'indexSpec.metricCompression',
+ name: 'spec.tuningConfig.indexSpec.metricCompression',
label: 'Index metric compression',
type: 'string',
defaultValue: 'lz4',
@@ -1763,7 +1752,7 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
info: <>Compression format for primitive type metric columns.>,
},
{
- name: 'indexSpec.longEncoding',
+ name: 'spec.tuningConfig.indexSpec.longEncoding',
label: 'Index long encoding',
type: 'string',
defaultValue: 'longs',
@@ -1779,43 +1768,79 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'chatHandlerTimeout',
+ name: 'spec.tuningConfig.splitHintSpec.maxSplitSize',
+ type: 'number',
+ defaultValue: 1073741824,
+ min: 1000000,
+   defined: s =>
+     s.type === 'index_parallel' && deepGet(s, 'spec.ioConfig.inputSource.type') !== 'http',
+ hideInMore: true,
+   adjustment: s => deepSet(s, 'spec.tuningConfig.splitHintSpec.type', 'maxSize'),
+ info: (
+ <>
+ Maximum number of bytes of input files to process in a single subtask. If a single file is
+ larger than this number, it will be processed by itself in a single subtask (Files are never
+ split across tasks yet).
+ >
+ ),
+ },
+ {
+ name: 'spec.tuningConfig.splitHintSpec.maxNumFiles',
+ type: 'number',
+ defaultValue: 1000,
+ min: 1,
+ defined: s => s.type === 'index_parallel',
+ hideInMore: true,
+   adjustment: s => deepSet(s, 'spec.tuningConfig.splitHintSpec.type', 'maxSize'),
+ info: (
+ <>
+ Maximum number of input files to process in a single subtask. This limit is to avoid task
+ failures when the ingestion spec is too long. There are two known limits on the max size of
+ serialized ingestion spec, i.e., the max ZNode size in ZooKeeper (
+ jute.maxbuffer) and the max packet size in MySQL (
+ max_allowed_packet). These can make ingestion tasks fail if the serialized
+ ingestion spec size hits one of them.
+ >
+ ),
+ },
+ {
+ name: 'spec.tuningConfig.chatHandlerTimeout',
type: 'duration',
defaultValue: 'PT10S',
- defined: (t: TuningConfig) => t.type === 'index_parallel',
+ defined: s => s.type === 'index_parallel',
hideInMore: true,
info: <>Timeout for reporting the pushed segments in worker tasks.>,
},
{
- name: 'chatHandlerNumRetries',
+ name: 'spec.tuningConfig.chatHandlerNumRetries',
type: 'number',
defaultValue: 5,
- defined: (t: TuningConfig) => t.type === 'index_parallel',
+ defined: s => s.type === 'index_parallel',
hideInMore: true,
info: <>Retries for reporting the pushed segments in worker tasks.>,
},
{
- name: 'workerThreads',
+ name: 'spec.tuningConfig.workerThreads',
type: 'number',
placeholder: 'min(10, taskCount)',
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
info: (
<>The number of threads that will be used by the supervisor for asynchronous operations.>
),
},
{
- name: 'chatThreads',
+ name: 'spec.tuningConfig.chatThreads',
type: 'number',
placeholder: 'min(10, taskCount * replicas)',
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
hideInMore: true,
info: <>The number of threads that will be used for communicating with indexing tasks.>,
},
{
- name: 'chatRetries',
+ name: 'spec.tuningConfig.chatRetries',
type: 'number',
defaultValue: 8,
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
hideInMore: true,
info: (
<>
@@ -1825,17 +1850,17 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'httpTimeout',
+ name: 'spec.tuningConfig.httpTimeout',
type: 'duration',
defaultValue: 'PT10S',
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
info: <>How long to wait for a HTTP response from an indexing task.>,
},
{
- name: 'shutdownTimeout',
+ name: 'spec.tuningConfig.shutdownTimeout',
type: 'duration',
defaultValue: 'PT80S',
- defined: (t: TuningConfig) => oneOf(t.type, 'kafka', 'kinesis'),
+ defined: s => oneOf(s.type, 'kafka', 'kinesis'),
hideInMore: true,
info: (
<>
@@ -1844,10 +1869,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'offsetFetchPeriod',
+ name: 'spec.tuningConfig.offsetFetchPeriod',
type: 'duration',
defaultValue: 'PT30S',
- defined: (t: TuningConfig) => t.type === 'kafka',
+ defined: s => s.type === 'kafka',
info: (
<>
How often the supervisor queries Kafka and the indexing tasks to fetch current offsets and
@@ -1856,10 +1881,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'recordBufferSize',
+ name: 'spec.tuningConfig.recordBufferSize',
type: 'number',
defaultValue: 10000,
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
info: (
<>
Size of the buffer (number of events) used between the Kinesis fetch threads and the main
@@ -1868,10 +1893,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'recordBufferOfferTimeout',
+ name: 'spec.tuningConfig.recordBufferOfferTimeout',
type: 'number',
defaultValue: 5000,
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
hideInMore: true,
info: (
<>
@@ -1881,11 +1906,11 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'recordBufferFullWait',
+ name: 'spec.tuningConfig.recordBufferFullWait',
hideInMore: true,
type: 'number',
defaultValue: 5000,
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
info: (
<>
Length of time in milliseconds to wait for the buffer to drain before attempting to fetch
@@ -1894,10 +1919,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'fetchSequenceNumberTimeout',
+ name: 'spec.tuningConfig.fetchSequenceNumberTimeout',
type: 'number',
defaultValue: 60000,
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
hideInMore: true,
info: (
<>
@@ -1909,10 +1934,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'fetchThreads',
+ name: 'spec.tuningConfig.fetchThreads',
type: 'number',
placeholder: 'max(1, {numProcessors} - 1)',
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
hideInMore: true,
info: (
<>
@@ -1922,10 +1947,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'maxRecordsPerPoll',
+ name: 'spec.tuningConfig.maxRecordsPerPoll',
type: 'number',
defaultValue: 100,
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
hideInMore: true,
info: (
<>
@@ -1935,10 +1960,10 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
),
},
{
- name: 'repartitionTransitionDuration',
+ name: 'spec.tuningConfig.repartitionTransitionDuration',
type: 'duration',
defaultValue: 'PT2M',
- defined: (t: TuningConfig) => t.type === 'kinesis',
+ defined: s => s.type === 'kinesis',
hideInMore: true,
info: (
<>
@@ -1959,8 +1984,8 @@ const TUNING_CONFIG_FORM_FIELDS: Field[] = [
},
];
-export function getTuningSpecFormFields() {
- return TUNING_CONFIG_FORM_FIELDS;
+export function getTuningFormFields() {
+ return TUNING_FORM_FIELDS;
}
export interface IndexSpec {
diff --git a/web-console/src/druid-models/lookup-spec.tsx b/web-console/src/druid-models/lookup-spec.tsx
index c9e0e5a13bde..31405f311719 100644
--- a/web-console/src/druid-models/lookup-spec.tsx
+++ b/web-console/src/druid-models/lookup-spec.tsx
@@ -104,8 +104,8 @@ export const LOOKUP_FIELDS: Field[] = [
// cachedNamespace lookups have more options
{
name: 'extractionNamespace.type',
- type: 'string',
label: 'Globally cached lookup type',
+ type: 'string',
placeholder: 'uri',
suggestions: ['uri', 'jdbc'],
defined: (model: LookupSpec) => model.type === 'cachedNamespace',
@@ -113,8 +113,8 @@ export const LOOKUP_FIELDS: Field[] = [
},
{
name: 'extractionNamespace.uriPrefix',
- type: 'string',
label: 'URI prefix',
+ type: 'string',
placeholder: 's3://bucket/some/key/prefix/',
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -145,8 +145,8 @@ export const LOOKUP_FIELDS: Field[] = [
},
{
name: 'extractionNamespace.fileRegex',
- type: 'string',
label: 'File regex',
+ type: 'string',
defaultValue: '.*',
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -157,8 +157,8 @@ export const LOOKUP_FIELDS: Field[] = [
// namespaceParseSpec
{
name: 'extractionNamespace.namespaceParseSpec.format',
- type: 'string',
label: 'Parse format',
+ type: 'string',
suggestions: ['csv', 'tsv', 'simpleJson', 'customJson'],
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'uri',
required: true,
@@ -177,7 +177,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.skipHeaderRows',
type: 'number',
- label: 'Skip header rows',
defaultValue: 0,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -187,7 +186,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.hasHeaderRow',
type: 'boolean',
- label: 'Has header row',
defaultValue: false,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -197,7 +195,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.columns',
type: 'string-array',
- label: 'Columns',
placeholder: `["key", "value"]`,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -209,7 +206,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.keyColumn',
type: 'string',
- label: 'Key column',
placeholder: '(optional - defaults to the first column)',
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -219,7 +215,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.valueColumn',
type: 'string',
- label: 'Value column',
placeholder: '(optional - defaults to the second column)',
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -231,7 +226,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.delimiter',
type: 'string',
- label: 'Delimiter',
placeholder: `(optional)`,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -240,7 +234,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.listDelimiter',
type: 'string',
- label: 'List delimiter',
placeholder: `(optional)`,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -251,7 +244,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.keyFieldName',
type: 'string',
- label: 'Key field name',
placeholder: `key`,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -261,7 +253,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespaceParseSpec.valueFieldName',
type: 'string',
- label: 'Value field name',
placeholder: `value`,
defined: (model: LookupSpec) =>
deepGet(model, 'extractionNamespace.type') === 'uri' &&
@@ -271,7 +262,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.pollPeriod',
type: 'string',
- label: 'Poll period',
defaultValue: '0',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'uri',
info: `Period between polling for updates`,
@@ -281,7 +271,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.namespace',
type: 'string',
- label: 'Namespace',
placeholder: 'some_lookup',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
required: true,
@@ -297,8 +286,8 @@ export const LOOKUP_FIELDS: Field[] = [
},
{
name: 'extractionNamespace.connectorConfig.connectURI',
- type: 'string',
label: 'Connect URI',
+ type: 'string',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
required: true,
info: 'Defines the connectURI value on the The connector config to used',
@@ -306,28 +295,24 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.connectorConfig.user',
type: 'string',
- label: 'User',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
info: 'Defines the user to be used by the connector config',
},
{
name: 'extractionNamespace.connectorConfig.password',
type: 'string',
- label: 'Password',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
info: 'Defines the password to be used by the connector config',
},
{
name: 'extractionNamespace.connectorConfig.createTables',
type: 'boolean',
- label: 'Create tables',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
info: 'Should tables be created',
},
{
name: 'extractionNamespace.table',
type: 'string',
- label: 'Table',
placeholder: 'some_lookup_table',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
required: true,
@@ -347,7 +332,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.keyColumn',
type: 'string',
- label: 'Key column',
placeholder: 'my_key_value',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
required: true,
@@ -367,7 +351,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.valueColumn',
type: 'string',
- label: 'Value column',
placeholder: 'my_column_value',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
required: true,
@@ -387,7 +370,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'extractionNamespace.filter',
type: 'string',
- label: 'Filter',
placeholder: '(optional)',
defined: (model: LookupSpec) => deepGet(model, 'extractionNamespace.type') === 'jdbc',
info: (
@@ -427,7 +409,6 @@ export const LOOKUP_FIELDS: Field[] = [
{
name: 'firstCacheTimeout',
type: 'number',
- label: 'First cache timeout',
defaultValue: 0,
defined: (model: LookupSpec) => model.type === 'cachedNamespace',
info: `How long to wait (in ms) for the first run of the cache to populate. 0 indicates to not wait`,
diff --git a/web-console/src/views/load-data-view/load-data-view.tsx b/web-console/src/views/load-data-view/load-data-view.tsx
index 4ee62e15e569..898482e81f4d 100644
--- a/web-console/src/views/load-data-view/load-data-view.tsx
+++ b/web-console/src/views/load-data-view/load-data-view.tsx
@@ -98,7 +98,7 @@ import {
getRollup,
getSecondaryPartitionRelatedFormFields,
getSpecType,
- getTuningSpecFormFields,
+ getTuningFormFields,
IngestionComboTypeWithExtra,
IngestionSpec,
InputFormat,
@@ -2935,7 +2935,7 @@ export class LoadDataView extends React.PureComponent
You can make this ingestion run slightly faster by explicitly specifying the time
intervals for this dataset from the{' '}
- this.updateStep('filter')}>Filter step.
+ this.updateStep('filter')}>Filter step.
)}
@@ -2952,7 +2952,6 @@ export class LoadDataView extends React.PureComponent
+ A list of intervals describing what time chunks of segments should be created. This list
+ will be broken up and rounded-off based on the segmentGranularity.
+
+
+ If not provided, batch ingestion tasks will generally determine which time chunks to
+ output based on what timestamps are found in the input data.
+
+
+ If specified, batch ingestion tasks may be able to skip a determining-partitions phase,
+ which can result in faster ingestion. Batch ingestion tasks may also be able to request
+ all their locks up-front instead of one by one. Batch ingestion tasks will throw away any
+ records with timestamps outside of the specified intervals.
+
{nonsensicalSingleDimPartitioningMessage}
- {settingIntervalsWouldSpeedUpIngestion(spec) && (
-
-
- You can make this ingestion run slightly faster by explicitly specifying the time
- intervals for this dataset from the{' '}
- this.updateStep('filter')}>Filter step.
-
-
- )}
{this.renderNextBar({
disabled: invalidPartitionConfig(spec),
From 4696d9c13d873b5a22a9ee00cc57a401617278ea Mon Sep 17 00:00:00 2001
From: Vadim Ogievetsky
Date: Tue, 8 Dec 2020 15:15:17 -0800
Subject: [PATCH 13/14] work with all sorts of chars
---
web-console/e2e-tests/tutorial-batch.spec.ts | 9 ++++++---
web-console/src/singletons/api.spec.ts | 2 +-
web-console/src/singletons/api.ts | 10 +++++++++-
3 files changed, 16 insertions(+), 5 deletions(-)
diff --git a/web-console/e2e-tests/tutorial-batch.spec.ts b/web-console/e2e-tests/tutorial-batch.spec.ts
index f4fa45054632..842d7a50182e 100644
--- a/web-console/e2e-tests/tutorial-batch.spec.ts
+++ b/web-console/e2e-tests/tutorial-batch.spec.ts
@@ -16,13 +16,14 @@
* limitations under the License.
*/
+import { SqlRef } from 'druid-query-toolkit';
import * as playwright from 'playwright-chromium';
import { DatasourcesOverview } from './component/datasources/overview';
import { IngestionOverview } from './component/ingestion/overview';
import { ConfigureSchemaConfig } from './component/load-data/config/configure-schema';
-import { PartitionConfig } from './component/load-data/config/partition';
import { SegmentGranularity } from './component/load-data/config/partition';
+import { PartitionConfig } from './component/load-data/config/partition';
import { PublishConfig } from './component/load-data/config/publish';
import { LocalFileDataConnector } from './component/load-data/data-connector/local-file';
import { DataLoader } from './component/load-data/data-loader';
@@ -37,6 +38,8 @@ import { waitTillWebConsoleReady } from './util/setup';
jest.setTimeout(5 * 60 * 1000);
+const ALL_SORTS_OF_CHARS = '<>|!@#$%^&`\'".,:;\\*()[]{}Россия 한국 中国!?~';
+
describe('Tutorial: Loading a file', () => {
let browser: playwright.Browser;
let page: playwright.Page;
@@ -56,7 +59,7 @@ describe('Tutorial: Loading a file', () => {
it('Loads data from local disk', async () => {
const testName = 'load-data-from-local-disk-';
- const datasourceName = testName + new Date().toISOString();
+ const datasourceName = testName + ALL_SORTS_OF_CHARS + new Date().toISOString();
const dataConnector = new LocalFileDataConnector(page, {
baseDirectory: DRUID_EXAMPLES_QUICKSTART_TUTORIAL_DIR,
fileFilter: 'wikiticker-2015-09-12-sampled.json.gz',
@@ -168,7 +171,7 @@ async function validateDatasourceStatus(page: playwright.Page, datasourceName: s
async function validateQuery(page: playwright.Page, datasourceName: string) {
const queryOverview = new QueryOverview(page, UNIFIED_CONSOLE_URL);
- const query = `SELECT * FROM "${datasourceName}" ORDER BY __time`;
+ const query = `SELECT * FROM ${SqlRef.table(datasourceName)} ORDER BY __time`;
const results = await queryOverview.runQuery(query);
expect(results).toBeDefined();
expect(results.length).toBeGreaterThan(0);
diff --git a/web-console/src/singletons/api.spec.ts b/web-console/src/singletons/api.spec.ts
index 64429af4023f..8cb8581b1736 100644
--- a/web-console/src/singletons/api.spec.ts
+++ b/web-console/src/singletons/api.spec.ts
@@ -21,6 +21,6 @@ import { Api } from './api';
describe('Api', () => {
it('escapes stuff', () => {
expect(Api.encodePath('wikipedia')).toEqual('wikipedia');
- expect(Api.encodePath('wi%ki?pe#dia')).toEqual('wi%25ki%3Fpe%23dia');
+ expect(Api.encodePath(`wi%ki?pe#dia&'[]`)).toEqual('wi%25ki%3Fpe%23dia%26%27%5B%5D');
});
});
diff --git a/web-console/src/singletons/api.ts b/web-console/src/singletons/api.ts
index a05adf324610..7a05bdd398c8 100644
--- a/web-console/src/singletons/api.ts
+++ b/web-console/src/singletons/api.ts
@@ -46,6 +46,14 @@ export class Api {
}
static encodePath(path: string): string {
- return path.replace(/[?#%]/g, encodeURIComponent);
+ return path.replace(
+ /[?#%&'\[\]]/g,
+ c =>
+ '%' +
+ c
+ .charCodeAt(0)
+ .toString(16)
+ .toUpperCase(),
+ );
}
}
From 6f14ed257eb59a07ed402cff6da3f65887db9395 Mon Sep 17 00:00:00 2001
From: Vadim Ogievetsky
Date: Tue, 8 Dec 2020 18:17:12 -0800
Subject: [PATCH 14/14] fix enabled view
---
web-console/src/views/load-data-view/load-data-view.tsx | 9 +--------
1 file changed, 1 insertion(+), 8 deletions(-)
diff --git a/web-console/src/views/load-data-view/load-data-view.tsx b/web-console/src/views/load-data-view/load-data-view.tsx
index 971634718f59..ff7db4d6d2e1 100644
--- a/web-console/src/views/load-data-view/load-data-view.tsx
+++ b/web-console/src/views/load-data-view/load-data-view.tsx
@@ -470,20 +470,13 @@ export class LoadDataView extends React.PureComponent