Merged
4 changes: 2 additions & 2 deletions docs/content/configuration/index.md
@@ -1254,8 +1254,8 @@ These Historical configurations can be defined in the `historical/runtime.proper
|`druid.segmentCache.dropSegmentDelayMillis`|How long a process delays before completely dropping a segment.|30000 (30 seconds)|
|`druid.segmentCache.infoDir`|Historical processes keep track of the segments they are serving so that when the process is restarted they can reload the same segments without waiting for the Coordinator to reassign. This path defines where this metadata is kept. Directory will be created if needed.|${first_location}/info_dir|
|`druid.segmentCache.announceIntervalMillis`|How frequently to announce segments while segments are loading from cache. Set this value to zero to wait for all segments to be loaded before announcing.|5000 (5 seconds)|
|`druid.segmentCache.numLoadingThreads`|How many segments to drop or load concurrently from deep storage.|10|
|`druid.segmentCache.numBootstrapThreads`|How many segments to load concurrently from local storage at startup.|Same as numLoadingThreads|
|`druid.segmentCache.numLoadingThreads`|How many segments to drop or load concurrently from deep storage. Note that loading a segment is not purely I/O bound: it also involves downloading the segment from deep storage, decompressing it, and memory-mapping it. Depending on CPU and network load, this config could be increased to a higher value.|Number of cores|
|`druid.coordinator.loadqueuepeon.curator.numCallbackThreads`|Number of threads for executing callback actions associated with loading or dropping of segments. Consider increasing this number when clusters are lagging behind in balancing segments across Historical nodes.|2|

In `druid.segmentCache.locations`, *freeSpacePercent* was added because the *maxSize* setting is only a theoretical limit and assumes that much space will always be available for storing segments. If a Druid bug leaves unaccounted segment files on disk, or some other process writes to the same disk, this check fails segment loading early, before the disk fills up completely, leaving the host otherwise usable.
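For illustration, these settings might look as follows in a Historical's runtime properties file. The path, size, and thread count are made-up example values, not recommendations:

```properties
# Cap each cache location at ~300 GB, but also refuse new segments
# once less than 5% of the disk is free (the freeSpacePercent guard).
druid.segmentCache.locations=[{"path": "/mnt/druid/segment-cache", "maxSize": 300000000000, "freeSpacePercent": 5.0}]
# Explicitly override the load/drop concurrency instead of using the default.
druid.segmentCache.numLoadingThreads=16
```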

@@ -22,6 +22,7 @@
import com.fasterxml.jackson.annotation.JsonProperty;
import com.google.common.collect.Lists;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.utils.JvmUtils;
import org.hibernate.validator.constraints.NotEmpty;

import java.io.File;
@@ -46,7 +47,7 @@ public class SegmentLoaderConfig
private int announceIntervalMillis = 0; // do not background announce

@JsonProperty("numLoadingThreads")
private int numLoadingThreads = 10;
private int numLoadingThreads = JvmUtils.getRuntimeInfo().getAvailableProcessors();
Contributor:
Why this change? It doesn't seem likely to me that the segment loading will be CPU-bound (it's probably I/O bound, I'd guess).

Contributor Author:
Before, the `numLoadingThreads` config wasn't being used. These threads also do the CPU-intensive work of decompressing segments and memory-mapping them. But you are right, the work is probably more I/O bound than CPU bound. The change I made provides more of a lower bound on the minimum number of threads that should be safe for this pool, but I could be swayed to change it back to what it was. FWIW, in our internal setup I have set the config to 2 * the number of CPUs and it has been holding up fine.

Contributor:
It should be configurable.

Contributor Author:
The value is configurable. One can use the `druid.segmentCache.numLoadingThreads` config for this.

Member:
The documentation is not updated; it still says 10 threads.

@samarthjain could you please update the documentation with a more elaborate discussion of how (and why) anyone would possibly want to change this configuration, and in which direction?
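The review thread above boils down to a default-with-override pattern: honor an explicit `druid.segmentCache.numLoadingThreads` setting, otherwise fall back to the CPU count. A minimal sketch under assumed names (the class and method here are hypothetical; in the actual change the default comes from `JvmUtils.getRuntimeInfo().getAvailableProcessors()`):

```java
// Hypothetical sketch of the default-with-override behavior discussed above.
public class NumLoadingThreadsDefault
{
  // Returns the explicitly configured value if present,
  // otherwise the number of available processors.
  public static int resolve(Integer configured)
  {
    if (configured != null) {
      return configured;
    }
    return Runtime.getRuntime().availableProcessors();
  }

  public static void main(String[] args)
  {
    // An explicit config value always wins over the CPU-based default.
    System.out.println(resolve(16));
    System.out.println(resolve(null) >= 1);
  }
}
```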


@JsonProperty("numBootstrapThreads")
private Integer numBootstrapThreads = null;
@@ -32,9 +32,11 @@
import org.apache.druid.java.util.common.lifecycle.LifecycleStart;
import org.apache.druid.java.util.common.lifecycle.LifecycleStop;
import org.apache.druid.java.util.emitter.EmittingLogger;
import org.apache.druid.segment.loading.SegmentLoaderConfig;
import org.apache.druid.server.initialization.ZkPathsConfig;

import java.io.IOException;
import java.util.concurrent.ExecutorService;

/**
* Use {@link org.apache.druid.server.coordinator.HttpLoadQueuePeon} for segment load/drops.
@@ -54,21 +56,27 @@ public class ZkCoordinator

private volatile PathChildrenCache loadQueueCache;
private volatile boolean started = false;
private final ExecutorService segmentLoadUnloadService;

@Inject
public ZkCoordinator(
SegmentLoadDropHandler loadDropHandler,
ObjectMapper jsonMapper,
ZkPathsConfig zkPaths,
DruidServerMetadata me,
CuratorFramework curator
CuratorFramework curator,
SegmentLoaderConfig config
)
{
this.dataSegmentChangeHandler = loadDropHandler;
this.jsonMapper = jsonMapper;
this.zkPaths = zkPaths;
this.me = me;
this.curator = curator;
this.segmentLoadUnloadService = Execs.multiThreaded(
config.getNumLoadingThreads(),
"ZKCoordinator--%d"
);
}
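The constructor above sizes a named pool with `Execs.multiThreaded`. As a rough, hedged stand-in for what such a helper provides (the class below is hypothetical, not Druid's implementation): a fixed-size pool whose worker threads follow a name pattern like `"ZKCoordinator--%d"`, which makes the segment load/unload workers easy to spot in thread dumps.

```java
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.ThreadFactory;
import java.util.concurrent.atomic.AtomicInteger;

// Hypothetical stand-in for a helper like Execs.multiThreaded.
public class NamedThreadPools
{
  public static ExecutorService multiThreaded(int threads, String nameFormat)
  {
    AtomicInteger counter = new AtomicInteger(0);
    ThreadFactory factory = runnable -> {
      // Each worker gets the pattern name with an incrementing index.
      Thread t = new Thread(runnable, String.format(nameFormat, counter.getAndIncrement()));
      t.setDaemon(true);
      return t;
    };
    return Executors.newFixedThreadPool(threads, factory);
  }

  public static void main(String[] args) throws Exception
  {
    ExecutorService pool = multiThreaded(2, "ZKCoordinator--%d");
    // Prints the worker thread's name, e.g. ZKCoordinator--0.
    System.out.println(pool.submit(() -> Thread.currentThread().getName()).get());
    pool.shutdown();
  }
}
```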

@LifecycleStart
@@ -102,63 +110,12 @@ public void start() throws IOException
new PathChildrenCacheListener()
{
@Override
public void childEvent(CuratorFramework client, PathChildrenCacheEvent event) throws Exception
public void childEvent(CuratorFramework client, PathChildrenCacheEvent event)
{
final ChildData child = event.getData();
switch (event.getType()) {
case CHILD_ADDED:
final String path = child.getPath();
final DataSegmentChangeRequest request = jsonMapper.readValue(
child.getData(), DataSegmentChangeRequest.class
);

log.info("New request[%s] with zNode[%s].", request.asString(), path);

try {
request.go(
dataSegmentChangeHandler,
new DataSegmentChangeCallback()
{
boolean hasRun = false;

@Override
public void execute()
{
try {
if (!hasRun) {
curator.delete().guaranteed().forPath(path);
log.info("Completed request [%s]", request.asString());
hasRun = true;
}
}
catch (Exception e) {
try {
curator.delete().guaranteed().forPath(path);
}
catch (Exception e1) {
log.error(e1, "Failed to delete zNode[%s], but ignoring exception.", path);
}
log.error(e, "Exception while removing zNode[%s]", path);
throw new RuntimeException(e);
}
}
}
);
}
catch (Exception e) {
try {
curator.delete().guaranteed().forPath(path);
}
catch (Exception e1) {
log.error(e1, "Failed to delete zNode[%s], but ignoring exception.", path);
}

log.makeAlert(e, "Segment load/unload: uncaught exception.")
.addData("node", path)
.addData("nodeProperties", request)
.emit();
}

childAdded(child);
break;
case CHILD_REMOVED:
log.info("zNode[%s] was removed", event.getData().getPath());
@@ -168,6 +125,7 @@ public void execute()
}
}
}

);
loadQueueCache.start();
}
@@ -180,6 +138,59 @@ public void execute()
}
}

private void childAdded(ChildData child)
{
segmentLoadUnloadService.submit(() -> {
final String path = child.getPath();
DataSegmentChangeRequest request = new SegmentChangeRequestNoop();
try {
final DataSegmentChangeRequest finalRequest = jsonMapper.readValue(
child.getData(),
DataSegmentChangeRequest.class
);

finalRequest.go(
dataSegmentChangeHandler,
new DataSegmentChangeCallback()
{
@Override
public void execute()
{
try {
curator.delete().guaranteed().forPath(path);
log.info("Completed request [%s]", finalRequest.asString());
}
catch (Exception e) {
try {
curator.delete().guaranteed().forPath(path);
}
catch (Exception e1) {
log.error(e1, "Failed to delete zNode[%s], but ignoring exception.", path);
}
log.error(e, "Exception while removing zNode[%s]", path);
throw new RuntimeException(e);
}
}
}
);
}
catch (Exception e) {
// Something went wrong in either deserializing the request using jsonMapper or when invoking it
try {
curator.delete().guaranteed().forPath(path);
}
catch (Exception e1) {
log.error(e1, "Failed to delete zNode[%s], but ignoring exception.", path);
}

log.makeAlert(e, "Segment load/unload: uncaught exception.")
.addData("node", path)
.addData("nodeProperties", request)
.emit();
}
});
}
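The `childAdded` method above follows a submit-and-clean-up pattern: the Curator watcher thread only enqueues work, a pool worker runs the potentially slow load/drop, and the request znode is deleted whether the request succeeds or fails. A stripped-down sketch of that shape (all names hypothetical; a plain `Runnable` stands in for the change request, and a single `finally` approximates the success-and-failure cleanup paths in the real code):

```java
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;

// Hypothetical sketch of the childAdded pattern: enqueue fast, clean up always.
public class OffloadPattern
{
  public static void handle(ExecutorService pool, Runnable request, Runnable deleteZnode)
  {
    pool.submit(() -> {
      try {
        request.run();       // the potentially slow segment load/drop
      }
      finally {
        deleteZnode.run();   // remove the request node no matter what
      }
    });
  }

  public static void main(String[] args) throws Exception
  {
    ExecutorService pool = Executors.newSingleThreadExecutor();
    handle(pool, () -> System.out.println("loaded segment"), () -> System.out.println("deleted znode"));
    pool.shutdown();
    pool.awaitTermination(5, TimeUnit.SECONDS);
  }
}
```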

@LifecycleStop
public void stop()
{