Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
49 commits
Select commit Hold shift + click to select a range
aea7754
Bound memory in native batch ingest create segments
Apr 16, 2021
1558ce7
Move BatchAppenderatorDriverTest to indexing service... note that we …
May 22, 2021
e3946fc
Remove sinks from memory and clean up intermediate persists dirs manu…
May 24, 2021
4e8d573
Changed name from RealtimeAppenderator to StreamAppenderator
May 25, 2021
b20582f
Style
May 25, 2021
eec4f39
Incorporating tests from StreamAppenderatorTest
May 26, 2021
30e1ec3
Keep totalRows and cleanup code
May 29, 2021
00922d7
Added missing dep
May 29, 2021
00dd32b
Fix unit test
May 29, 2021
864357d
Checkstyle
Jun 1, 2021
2fa2a9d
allowIncrementalPersists should always be true for batch
Jun 1, 2021
5b0157b
Added sinks metadata
Jun 1, 2021
0312763
clear sinks metadata when closing appenderator
Jun 1, 2021
e308d68
Style + minor edits to log msgs
Jun 2, 2021
e55c40e
Update sinks metadata & totalRows when dropping a sink (segment)
Jun 2, 2021
4bb61a7
Remove max
Jun 2, 2021
dddd4e4
Intelli-j check
Jun 3, 2021
19bdee0
Keep a count of hydrants persisted by sink for sanity check before merge
Jun 3, 2021
f1211f0
Move out sanity
Jun 4, 2021
1f37d5d
Add previous hydrant count to sink metadata
Jun 4, 2021
e0c3e16
Remove redundant field from SinkMetadata
Jun 4, 2021
4fb1f47
Remove unneeded functions
Jun 4, 2021
10264dc
Cleanup unused code
Jun 4, 2021
f74baaf
Removed unused code
Jun 4, 2021
34cffcf
Remove unused field
Jun 4, 2021
fac1ca1
Exclude it from jacoco because it is very hard to get branch coverage
Jun 5, 2021
af93370
Remove segment announcement and some other minor cleanup
Jun 7, 2021
a019433
Add fallback flag
Jun 7, 2021
a296703
Minor code cleanup
Jun 22, 2021
a645041
Checkstyle
Jun 22, 2021
728dbb9
Merge branch 'master' into bound-mem-dynamic
Jun 24, 2021
2b321f5
Code review changes
Jun 25, 2021
afb6141
Update batchMemoryMappedIndex name
Jun 25, 2021
8077c01
Code review comments
Jul 1, 2021
2c71c7d
Exclude class from coverage, will include again when packaging gets f…
Jul 1, 2021
ff5e2ed
Moved test classes to server module
Jul 1, 2021
34e1342
More BatchAppenderator cleanup
Jul 2, 2021
dfcdf8f
Fix bug in wrong counting of totalHydrants plus minor cleanup in add
Jul 2, 2021
3e7fcff
Removed left over comments
Jul 2, 2021
d082d01
Have BatchAppenderator follow the Appenderator contract for push & ge…
Jul 2, 2021
62e4ac3
Merge branch 'master' into bound-mem-dynamic
Jul 2, 2021
6704a25
Fix LGTM violations
Jul 3, 2021
3f274c1
Review comments
Jul 6, 2021
cea716a
Add stats after push is done
Jul 6, 2021
1f267a8
Code review comments (cleanup, remove rest of synchronization constru…
Jul 8, 2021
291039e
Update javadocs
Jul 8, 2021
daf233b
Add thread safety notice to BatchAppenderator
Jul 8, 2021
0dedc87
Further cleanup config
Jul 9, 2021
effe090
More config cleanup
Jul 9, 2021
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion docs/configuration/index.md
Original file line number Diff line number Diff line change
Expand Up @@ -1334,7 +1334,7 @@ Additional peon configs include:
|`druid.peon.mode`|Choices are "local" and "remote". Setting this to local means you intend to run the peon as a standalone process (Not recommended).|remote|
|`druid.indexer.task.baseDir`|Base temporary working directory.|`System.getProperty("java.io.tmpdir")`|
|`druid.indexer.task.baseTaskDir`|Base temporary working directory for tasks.|`${druid.indexer.task.baseDir}/persistent/task`|
|`druid.indexer.task.batchMemoryMappedIndex`|If false, native batch ingestion will not map indexes thus saving heap space. This does not apply to streaming ingestion, just to batch. This setting should only be used when a bug is suspected or found in the new batch ingestion code that avoids memory mapping indices. If a bug is suspected or found, you can set this flag to `true` to fall back to previous, working but more memory intensive, code path.|`false`|
|`druid.indexer.task.useLegacyBatchProcessing`|If false, native batch ingestion uses the new, recommended code path, which is memory-optimized for the segment creation phase. If true, it uses the previous code path for the segment creation phase of batch ingestion. This applies only to batch ingestion, not to streaming ingestion. Set this flag to `true` only when a bug is suspected or found in the new optimized batch ingestion code, in order to fall back to the previous, working but more memory-intensive code path.|`false`|
|`druid.indexer.task.defaultHadoopCoordinates`|Hadoop version to use with HadoopIndexTasks that do not request a particular version.|org.apache.hadoop:hadoop-client:2.8.5|
|`druid.indexer.task.defaultRowFlushBoundary`|Highest row count before persisting to disk. Used for indexing generating tasks.|75000|
|`druid.indexer.task.directoryLockTimeout`|Wait this long for zombie peons to exit before giving up on their replacements.|PT10M|
Expand Down
11 changes: 5 additions & 6 deletions indexing-service/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -62,11 +62,6 @@
<artifactId>druid-hll</artifactId>
<version>${project.parent.version}</version>
</dependency>
<dependency>
<groupId>org.apache.commons</groupId>
<artifactId>commons-collections4</artifactId>
<version>4.2</version>
</dependency>
<dependency>
<groupId>io.dropwizard.metrics</groupId>
<artifactId>metrics-core</artifactId>
Expand Down Expand Up @@ -232,7 +227,11 @@
<artifactId>jackson-core-asl</artifactId>
<scope>provided</scope>
</dependency>

<dependency>
<groupId>org.apache.commons</groupId>
<artifactId>commons-collections4</artifactId>
<scope>provided</scope>
</dependency>
<!-- Tests -->
<dependency>
<groupId>junit</groupId>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -77,7 +77,7 @@ public class TaskConfig
private final boolean ignoreTimestampSpecForDruidInputSource;

@JsonProperty
private final boolean batchMemoryMappedIndex;
private final boolean useLegacyBatchProcessing;

@JsonCreator
public TaskConfig(
Expand All @@ -91,7 +91,7 @@ public TaskConfig(
@JsonProperty("directoryLockTimeout") Period directoryLockTimeout,
@JsonProperty("shuffleDataLocations") List<StorageLocationConfig> shuffleDataLocations,
@JsonProperty("ignoreTimestampSpecForDruidInputSource") boolean ignoreTimestampSpecForDruidInputSource,
@JsonProperty("batchMemoryMappedIndex") boolean batchMemoryMapIndex // only set to true to fall back to older behavior
@JsonProperty("useLegacyBatchProcessing") boolean useLegacyBatchProcessing // only set to true to fall back to older behavior
)
{
this.baseDir = baseDir == null ? System.getProperty("java.io.tmpdir") : baseDir;
Expand All @@ -117,7 +117,7 @@ public TaskConfig(
this.shuffleDataLocations = shuffleDataLocations;
}
this.ignoreTimestampSpecForDruidInputSource = ignoreTimestampSpecForDruidInputSource;
this.batchMemoryMappedIndex = batchMemoryMapIndex;
this.useLegacyBatchProcessing = useLegacyBatchProcessing;
}

@JsonProperty
Expand Down Expand Up @@ -201,9 +201,9 @@ public boolean isIgnoreTimestampSpecForDruidInputSource()
}

@JsonProperty
public boolean getBatchMemoryMappedIndex()
public boolean getuseLegacyBatchProcessing()
{
return batchMemoryMappedIndex;
return useLegacyBatchProcessing;
}


Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -81,7 +81,7 @@ public static Appenderator newAppenderator(
toolbox.getIndexMergerV9(),
rowIngestionMeters,
parseExceptionHandler,
toolbox.getConfig().getBatchMemoryMappedIndex()
toolbox.getConfig().getuseLegacyBatchProcessing()
);
}

Expand Down

This file was deleted.

Loading