Fix maxBytesInMemory for heap overhead of all sinks and hydrants check (#10891)

* fix maxBytesInMemory

* fix maxBytesInMemory check

* fix maxBytesInMemory check

* fix test
Maytas Monsereenusorn 2021-02-18 21:48:57 -08:00 committed by GitHub
parent cbbef80c7f
commit f5bfccc720
2 changed files with 45 additions and 39 deletions
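
At a high level, the change moves the safe-heap-usage check so that it runs before an incremental persist is scheduled (first hunk below) instead of after persisting (removed block further down), and makes it account for the estimated heap overhead of every sink and every memory-mapped hydrant, not just the rows still buffered in memory. As a back-of-the-envelope sketch of that accounting — a hypothetical helper, not Druid code; only ROUGH_OVERHEAD_PER_SINK appears in the diff below, and the constant values here are invented:

    // Hypothetical helper; the shape of the formula is the point, not the numbers.
    class HeapEstimateSketch
    {
      static final long ROUGH_OVERHEAD_PER_SINK = 5_000;    // assumed value
      static final long ROUGH_OVERHEAD_PER_HYDRANT = 1_000; // assumed value

      // rowBytes: bytes of rows currently buffered in memory across all sinks
      static long estimateHeapUsage(long rowBytes, int numSinks, int numHydrants)
      {
        return rowBytes
               + numSinks * ROUGH_OVERHEAD_PER_SINK
               + numHydrants * ROUGH_OVERHEAD_PER_HYDRANT;
      }
    }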

AppenderatorImpl.java

@@ -332,6 +332,47 @@ public class AppenderatorImpl implements Appenderator
     if (allowIncrementalPersists) {
       // persistAll clears rowsCurrentlyInMemory, no need to update it.
       log.info("Flushing in-memory data to disk because %s.", String.join(",", persistReasons));
+      long bytesPersisted = 0L;
+      for (Map.Entry<SegmentIdWithShardSpec, Sink> entry : sinks.entrySet()) {
+        final Sink sinkEntry = entry.getValue();
+        if (sinkEntry != null) {
+          bytesPersisted += sinkEntry.getBytesInMemory();
+          if (sinkEntry.swappable()) {
+            // After swapping the sink, we use a memory-mapped segment instead. However, the memory-mapped segment still consumes memory.
+            // These memory-mapped segments are held in memory throughout the ingestion phase and permanently add to bytesCurrentlyInMemory.
+            int memoryStillInUse = calculateMMappedHydrantMemoryInUsed(sinkEntry.getCurrHydrant());
+            bytesCurrentlyInMemory.addAndGet(memoryStillInUse);
+          }
+        }
+      }
+      if (!skipBytesInMemoryOverheadCheck && bytesCurrentlyInMemory.get() - bytesPersisted > maxBytesTuningConfig) {
+        // We are still over maxBytesTuningConfig even after persisting.
+        // This means that we ran out of all available memory to ingest (due to overheads created as part of ingestion).
+        final String alertMessage = StringUtils.format(
+            "Task has exceeded safe estimated heap usage limits, failing "
+            + "(numSinks: [%d] numHydrantsAcrossAllSinks: [%d] totalRows: [%d])",
+            sinks.size(),
+            sinks.values().stream().mapToInt(Iterables::size).sum(),
+            getTotalRowCount()
+        );
+        final String errorMessage = StringUtils.format(
+            "%s.\nThis can occur when the overhead from too many intermediary segment persists becomes too "
+            + "great to have enough space to process additional input rows. This check, along with metering the overhead "
+            + "of these objects to factor into the 'maxBytesInMemory' computation, can be disabled by setting "
+            + "'skipBytesInMemoryOverheadCheck' to 'true' (note that doing so might allow the task to naturally encounter "
+            + "a 'java.lang.OutOfMemoryError'). Alternatively, 'maxBytesInMemory' can be increased, which will cause an "
+            + "increase in heap footprint but will allow more intermediary segment persists to occur before "
+            + "reaching this condition.",
+            alertMessage
+        );
+        log.makeAlert(alertMessage)
+           .addData("dataSource", schema.getDataSource())
+           .emit();
+        throw new RuntimeException(errorMessage);
+      }
       Futures.addCallback(
           persistAll(committerSupplier == null ? null : committerSupplier.get()),
           new FutureCallback<Object>()
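
Taken out of its diff context, the guard added above amounts to the following. This is a minimal, self-contained sketch: Sink and the hydrant-overhead helper are reduced to stand-ins, and only the names taken from the diff are real.

    import java.util.Map;
    import java.util.concurrent.atomic.AtomicLong;

    /** Simplified stand-ins for the real appenderator types; illustrative only. */
    interface Sink
    {
      long getBytesInMemory(); // bytes held by the current in-memory hydrant
      boolean swappable();     // true if the current hydrant can be persisted
    }

    class HeapUsageGuardSketch
    {
      private final AtomicLong bytesCurrentlyInMemory = new AtomicLong();
      private final long maxBytesTuningConfig;
      private final boolean skipBytesInMemoryOverheadCheck;

      HeapUsageGuardSketch(long maxBytesTuningConfig, boolean skipBytesInMemoryOverheadCheck)
      {
        this.maxBytesTuningConfig = maxBytesTuningConfig;
        this.skipBytesInMemoryOverheadCheck = skipBytesInMemoryOverheadCheck;
      }

      /** Stand-in for calculateMMappedHydrantMemoryInUsed; a fixed estimate here. */
      private int mmapOverheadOfCurrentHydrant()
      {
        return 1_000; // assumed value
      }

      void checkBeforePersist(Map<String, Sink> sinks)
      {
        long bytesToBePersisted = 0L;
        for (Sink sink : sinks.values()) {
          if (sink != null) {
            bytesToBePersisted += sink.getBytesInMemory();
            if (sink.swappable()) {
              // A persisted hydrant is replaced by a memory-mapped segment that
              // still occupies heap, so its estimated overhead is metered up front.
              bytesCurrentlyInMemory.addAndGet(mmapOverheadOfCurrentHydrant());
            }
          }
        }
        if (!skipBytesInMemoryOverheadCheck
            && bytesCurrentlyInMemory.get() - bytesToBePersisted > maxBytesTuningConfig) {
          // Even a full persist cannot bring usage back under the limit, so fail
          // fast instead of drifting toward an OutOfMemoryError.
          throw new RuntimeException("Exceeded safe estimated heap usage limits");
        }
      }
    }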
@@ -513,7 +554,6 @@ public class AppenderatorImpl implements Appenderator
   public ListenableFuture<Object> persistAll(@Nullable final Committer committer)
   {
     throwPersistErrorIfExists();
-    long bytesInMemoryBeforePersist = bytesCurrentlyInMemory.get();
     final Map<String, Integer> currentHydrants = new HashMap<>();
     final List<Pair<FireHydrant, SegmentIdWithShardSpec>> indexesToPersist = new ArrayList<>();
     int numPersistedRows = 0;
@@ -539,16 +579,9 @@ public class AppenderatorImpl implements Appenderator
       }
       if (sink.swappable()) {
-        // After swapping the sink, we use a memory-mapped segment instead. However, the memory-mapped segment still consumes memory.
-        // These memory-mapped segments are held in memory throughout the ingestion phase and permanently add to bytesCurrentlyInMemory.
-        int memoryStillInUse = calculateMMappedHydrantMemoryInUsed(sink.getCurrHydrant());
-        bytesCurrentlyInMemory.addAndGet(memoryStillInUse);
         indexesToPersist.add(Pair.of(sink.swap(), identifier));
       }
     }
     log.debug("Submitting persist runnable for dataSource[%s]", schema.getDataSource());
     final Object commitMetadata = committer == null ? null : committer.getMetadata();
@@ -638,33 +671,6 @@ public class AppenderatorImpl implements Appenderator
     log.info("Persisted rows[%,d] and bytes[%,d]", numPersistedRows, bytesPersisted);
-    // bytesCurrentlyInMemory can change while persisting due to concurrent ingestion.
-    // Hence, we use bytesInMemoryBeforePersist to determine the change of this persist.
-    if (!skipBytesInMemoryOverheadCheck && bytesInMemoryBeforePersist - bytesPersisted > maxBytesTuningConfig) {
-      // We are still over maxBytesTuningConfig even after persisting.
-      // This means that we ran out of all available memory to ingest (due to overheads created as part of ingestion).
-      final String alertMessage = StringUtils.format(
-          "Task has exceeded safe estimated heap usage limits, failing "
-          + "(numSinks: [%d] numHydrantsAcrossAllSinks: [%d] totalRows: [%d])",
-          sinks.size(),
-          sinks.values().stream().mapToInt(Iterables::size).sum(),
-          getTotalRowCount()
-      );
-      final String errorMessage = StringUtils.format(
-          "%s.\nThis can occur when the overhead from too many intermediary segment persists becomes too "
-          + "great to have enough space to process additional input rows. This check, along with metering the overhead "
-          + "of these objects to factor into the 'maxBytesInMemory' computation, can be disabled by setting "
-          + "'skipBytesInMemoryOverheadCheck' to 'true' (note that doing so might allow the task to naturally encounter "
-          + "a 'java.lang.OutOfMemoryError'). Alternatively, 'maxBytesInMemory' can be increased, which will cause an "
-          + "increase in heap footprint but will allow more intermediary segment persists to occur before "
-          + "reaching this condition.",
-          alertMessage
-      );
-      log.makeAlert(alertMessage)
-         .addData("dataSource", schema.getDataSource())
-         .emit();
-      throw new RuntimeException(errorMessage);
-    }
     return future;
   }
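
Net effect of the removals above: persistAll() no longer snapshots bytesInMemoryBeforePersist, no longer meters the mmap overhead per swapped hydrant, and no longer performs the post-persist limit check, since all of that bookkeeping now happens up front, before the persist is scheduled. Condensed, the condition moved from the old form to the new one (variable names as in the diff):

    // old, evaluated in persistAll() after the persist bookkeeping:
    //   bytesInMemoryBeforePersist - bytesPersisted > maxBytesTuningConfig
    // new, evaluated before the persist is scheduled:
    //   bytesCurrentlyInMemory.get() - bytesPersisted > maxBytesTuningConfig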

AppenderatorTest.java

@@ -257,7 +257,7 @@ public class AppenderatorTest extends InitializedNullHandlingTest
   @Test
   public void testMaxBytesInMemory() throws Exception
   {
-    try (final AppenderatorTester tester = new AppenderatorTester(100, 10000, true)) {
+    try (final AppenderatorTester tester = new AppenderatorTester(100, 15000, true)) {
       final Appenderator appenderator = tester.getAppenderator();
       final AtomicInteger eventCount = new AtomicInteger(0);
       final Supplier<Committer> committerSupplier = () -> {
@@ -297,7 +297,7 @@ public class AppenderatorTest extends InitializedNullHandlingTest
       );
       // We do multiple more adds to the same sink to cause persist.
-      for (int i = 0; i < 26; i++) {
+      for (int i = 0; i < 53; i++) {
         appenderator.add(IDENTIFIERS.get(0), ir("2000", "bar_" + i, 1), committerSupplier);
       }
       sinkSizeOverhead = 1 * AppenderatorImpl.ROUGH_OVERHEAD_PER_SINK;
@@ -333,7 +333,7 @@ public class AppenderatorTest extends InitializedNullHandlingTest
       );
       // We do multiple more adds to the same sink to cause persist.
-      for (int i = 0; i < 5; i++) {
+      for (int i = 0; i < 31; i++) {
         appenderator.add(IDENTIFIERS.get(0), ir("2000", "bar_" + i, 1), committerSupplier);
       }
       // currHydrant size is 0 since we just persist all indexes to disk.
@@ -363,7 +363,7 @@ public class AppenderatorTest extends InitializedNullHandlingTest
   @Test(expected = RuntimeException.class)
   public void testTaskFailAsPersistCannotFreeAnyMoreMemory() throws Exception
   {
-    try (final AppenderatorTester tester = new AppenderatorTester(100, 10, true)) {
+    try (final AppenderatorTester tester = new AppenderatorTester(100, 5180, true)) {
       final Appenderator appenderator = tester.getAppenderator();
       final AtomicInteger eventCount = new AtomicInteger(0);
       final Supplier<Committer> committerSupplier = () -> {
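
Finally, a rough sketch of how the tightened guard surfaces to a caller, loosely adapted from testTaskFailAsPersistCannotFreeAnyMoreMemory above. The setup helpers (committerSupplier, IDENTIFIERS, ir) are the test's own; the loop bound is an assumption for illustration, not the test's actual sequence.

    // Illustrative only: keep adding rows until accumulated sink/hydrant
    // overhead exceeds maxBytesInMemory (5180 bytes here) and add() throws.
    try (final AppenderatorTester tester = new AppenderatorTester(100, 5180, true)) {
      final Appenderator appenderator = tester.getAppenderator();
      appenderator.startJob();
      for (int i = 0; i < 100; i++) {
        // Each incremental persist leaves memory-mapped overhead behind; once
        // even a full persist cannot free enough heap, the new check throws
        // the RuntimeException the test expects.
        appenderator.add(IDENTIFIERS.get(0), ir("2000", "bar_" + i, 1), committerSupplier);
      }
    }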