Allow value of RetainedHeapLimiter's threshold to change on each invocation.
PiperOrigin-RevId: 245266254
diff --git a/src/main/java/com/google/devtools/build/lib/runtime/BlazeCommandDispatcher.java b/src/main/java/com/google/devtools/build/lib/runtime/BlazeCommandDispatcher.java
index eb0823b..ffb9ef5 100644
--- a/src/main/java/com/google/devtools/build/lib/runtime/BlazeCommandDispatcher.java
+++ b/src/main/java/com/google/devtools/build/lib/runtime/BlazeCommandDispatcher.java
@@ -49,7 +49,6 @@
import com.google.devtools.build.lib.vfs.PathFragment;
import com.google.devtools.common.options.OpaqueOptionsData;
import com.google.devtools.common.options.OptionsParser;
-import com.google.devtools.common.options.OptionsParsingException;
import com.google.devtools.common.options.OptionsParsingResult;
import java.io.BufferedOutputStream;
import java.io.IOException;
@@ -382,18 +381,7 @@
.getOptions(BlazeServerStartupOptions.class)
.oomMoreEagerlyThreshold;
}
- if (oomMoreEagerlyThreshold < 0 || oomMoreEagerlyThreshold > 100) {
- reporter.handle(Event.error("--oom_more_eagerly_threshold must be non-negative percent"));
- return BlazeCommandResult.exitCode(ExitCode.COMMAND_LINE_ERROR);
- }
- if (oomMoreEagerlyThreshold != 100) {
- try {
- RetainedHeapLimiter.maybeInstallRetainedHeapLimiter(oomMoreEagerlyThreshold);
- } catch (OptionsParsingException e) {
- reporter.handle(Event.error(e.getMessage()));
- return BlazeCommandResult.exitCode(ExitCode.COMMAND_LINE_ERROR);
- }
- }
+ runtime.getRetainedHeapLimiter().updateThreshold(oomMoreEagerlyThreshold);
// We register an ANSI-allowing handler associated with {@code handler} so that ANSI control
// codes can be re-introduced later even if blaze is invoked with --color=no. This is useful
diff --git a/src/main/java/com/google/devtools/build/lib/runtime/BlazeRuntime.java b/src/main/java/com/google/devtools/build/lib/runtime/BlazeRuntime.java
index 103e4ce..fd1c4ac 100644
--- a/src/main/java/com/google/devtools/build/lib/runtime/BlazeRuntime.java
+++ b/src/main/java/com/google/devtools/build/lib/runtime/BlazeRuntime.java
@@ -161,6 +161,7 @@
private final BuildEventArtifactUploaderFactoryMap buildEventArtifactUploaderFactoryMap;
private final ActionKeyContext actionKeyContext;
private final ImmutableMap<String, AuthHeadersProvider> authHeadersProviderMap;
+ private final RetainedHeapLimiter retainedHeapLimiter = new RetainedHeapLimiter();
// Workspace state (currently exactly one workspace per server)
private BlazeWorkspace workspace;
@@ -490,6 +491,10 @@
return queryRuntimeHelperFactory;
}
+ RetainedHeapLimiter getRetainedHeapLimiter() {
+ return retainedHeapLimiter;
+ }
+
/**
* Hook method called by the BlazeCommandDispatcher prior to the dispatch of
* each command.
diff --git a/src/main/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiter.java b/src/main/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiter.java
index 4f288d3..9818921 100644
--- a/src/main/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiter.java
+++ b/src/main/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiter.java
@@ -14,84 +14,103 @@
package com.google.devtools.build.lib.runtime;
+import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Preconditions;
+import com.google.common.collect.ImmutableList;
+import com.google.common.flogger.GoogleLogger;
import com.google.devtools.build.lib.bugreport.BugReport;
-import com.google.devtools.common.options.OptionsParsingException;
+import com.google.devtools.build.lib.concurrent.ThreadSafety;
+import com.google.devtools.build.lib.util.AbruptExitException;
+import com.google.devtools.build.lib.util.ExitCode;
import com.sun.management.GarbageCollectionNotificationInfo;
import java.lang.management.GarbageCollectorMXBean;
import java.lang.management.ManagementFactory;
import java.lang.management.MemoryUsage;
import java.util.List;
import java.util.Map;
+import java.util.OptionalInt;
+import java.util.concurrent.TimeUnit;
import java.util.concurrent.atomic.AtomicBoolean;
-import java.util.logging.Logger;
+import java.util.concurrent.atomic.AtomicLong;
+import javax.management.ListenerNotFoundException;
import javax.management.Notification;
import javax.management.NotificationEmitter;
import javax.management.NotificationListener;
import javax.management.openmbean.CompositeData;
/**
- * Monitor the size of the retained heap and exit promptly if it grows too large. Specifically,
- * check the size of the tenured space after each major GC; if it exceeds 90%, call
- * {@code System.gc()} to trigger a stop-the-world collection; if it's still more than 90% full,
- * exit with an {@link OutOfMemoryError}.
+ * Monitor the size of the retained heap and exit promptly if it grows too large. Specifically,
+ * check the size of the tenured space after each major GC; if it exceeds {@link
+ * #occupiedHeapPercentageThreshold}%, call {@code System.gc()} to trigger a stop-the-world
+ * collection; if it's still more than {@link #occupiedHeapPercentageThreshold}% full, exit with an
+ * {@link OutOfMemoryError}.
*/
class RetainedHeapLimiter implements NotificationListener {
- private static final Logger logger = Logger.getLogger(RetainedHeapLimiter.class.getName());
+ private static final GoogleLogger logger = GoogleLogger.forEnclosingClass();
private static final long MIN_TIME_BETWEEN_TRIGGERED_GC_MILLISECONDS = 60000;
- private static int registeredOccupiedHeapPercentageThreshold = -1;
-
- static void maybeInstallRetainedHeapLimiter(int occupiedHeapPercentageThreshold)
- throws OptionsParsingException {
- if (registeredOccupiedHeapPercentageThreshold == -1) {
- registeredOccupiedHeapPercentageThreshold = occupiedHeapPercentageThreshold;
- new RetainedHeapLimiter(occupiedHeapPercentageThreshold).install();
- }
- if (registeredOccupiedHeapPercentageThreshold != occupiedHeapPercentageThreshold) {
- throw new OptionsParsingException(
- "Old threshold of "
- + registeredOccupiedHeapPercentageThreshold
- + " not equal to new threshold of "
- + occupiedHeapPercentageThreshold
- + ". To change the threshold, shut down the server and restart it with the desired "
- + "value");
- }
- }
-
- private boolean installed = false;
private final AtomicBoolean throwingOom = new AtomicBoolean(false);
- private long lastTriggeredGcInMilliseconds = 0;
- private final int occupiedHeapPercentageThreshold;
+ private final ImmutableList<NotificationEmitter> tenuredGcEmitters;
+ private OptionalInt occupiedHeapPercentageThreshold = OptionalInt.empty();
+ private AtomicLong lastTriggeredGcInMilliseconds = new AtomicLong();
- RetainedHeapLimiter(int occupiedHeapPercentageThreshold) {
- this.occupiedHeapPercentageThreshold = occupiedHeapPercentageThreshold;
+ RetainedHeapLimiter() {
+ this(ManagementFactory.getGarbageCollectorMXBeans());
}
- void install() {
- Preconditions.checkState(!installed, "RetainedHeapLimiter installed twice");
- installed = true;
- List<GarbageCollectorMXBean> gcbeans = ManagementFactory.getGarbageCollectorMXBeans();
- boolean foundTenured = false;
+ @VisibleForTesting
+ RetainedHeapLimiter(List<GarbageCollectorMXBean> gcBeans) {
+ tenuredGcEmitters = findTenuredCollectorBeans(gcBeans);
+ Preconditions.checkState(
+ !tenuredGcEmitters.isEmpty(),
+ "Can't find tenured space; update this class for a new collector");
+ }
+
+ @ThreadSafety.ThreadCompatible // Can only be called on the logical main Bazel thread.
+ void updateThreshold(int occupiedHeapPercentageThreshold) throws AbruptExitException {
+ if (occupiedHeapPercentageThreshold < 0 || occupiedHeapPercentageThreshold > 100) {
+ throw new AbruptExitException(
+ "--experimental_oom_more_eagerly_threshold must be a percent between 0 and 100 but was "
+ + occupiedHeapPercentageThreshold,
+ ExitCode.COMMAND_LINE_ERROR);
+ }
+ boolean alreadyInstalled = this.occupiedHeapPercentageThreshold.isPresent();
+ this.occupiedHeapPercentageThreshold =
+ occupiedHeapPercentageThreshold < 100
+ ? OptionalInt.of(occupiedHeapPercentageThreshold)
+ : OptionalInt.empty();
+ boolean shouldBeInstalled = this.occupiedHeapPercentageThreshold.isPresent();
+ if (alreadyInstalled && !shouldBeInstalled) {
+ for (NotificationEmitter emitter : tenuredGcEmitters) {
+ try {
+ emitter.removeNotificationListener(this, null, null);
+ } catch (ListenerNotFoundException e) {
+ logger.atWarning().log("Couldn't remove self as listener from %s", emitter);
+ }
+ }
+ } else if (!alreadyInstalled && shouldBeInstalled) {
+ tenuredGcEmitters.forEach(e -> e.addNotificationListener(this, null, null));
+ }
+ }
+
+ @VisibleForTesting
+ static ImmutableList<NotificationEmitter> findTenuredCollectorBeans(
+ List<GarbageCollectorMXBean> gcBeans) {
+ ImmutableList.Builder<NotificationEmitter> builder = ImmutableList.builder();
// Examine all collectors and register for notifications from those which collect the tenured
// space. Normally there is one such collector.
- for (GarbageCollectorMXBean gcbean : gcbeans) {
- boolean collectsTenured = false;
- for (String name : gcbean.getMemoryPoolNames()) {
- collectsTenured |= isTenuredSpace(name);
- }
- if (collectsTenured) {
- foundTenured = true;
- NotificationEmitter emitter = (NotificationEmitter) gcbean;
- emitter.addNotificationListener(this, null, null);
+ for (GarbageCollectorMXBean gcBean : gcBeans) {
+ for (String name : gcBean.getMemoryPoolNames()) {
+ if (isTenuredSpace(name)) {
+ builder.add((NotificationEmitter) gcBean);
+ }
}
}
- if (!foundTenured) {
- throw new IllegalStateException(
- "Can't find tenured space; update this class for a new collector");
- }
+ return builder.build();
}
+ // Can be called concurrently, handles concurrent calls with #updateThreshold gracefully.
+ @ThreadSafety.ThreadSafe
@Override
public void handleNotification(Notification notification, Object handback) {
if (!notification
@@ -99,6 +118,14 @@
.equals(GarbageCollectionNotificationInfo.GARBAGE_COLLECTION_NOTIFICATION)) {
return;
}
+ // Get a local reference to guard against concurrent modifications.
+ OptionalInt occupiedHeapPercentageThreshold = this.occupiedHeapPercentageThreshold;
+ if (!occupiedHeapPercentageThreshold.isPresent()) {
+ // Presumably failure above to uninstall this listener, or a racy GC.
+ logger.atInfo().atMostEvery(1, TimeUnit.MINUTES).log(
+ "Got notification %s when should be disabled", notification);
+ return;
+ }
GarbageCollectionNotificationInfo info =
GarbageCollectionNotificationInfo.from((CompositeData) notification.getUserData());
Map<String, MemoryUsage> spaces = info.getGcInfo().getMemoryUsageAfterGc();
@@ -106,12 +133,12 @@
if (isTenuredSpace(entry.getKey())) {
MemoryUsage space = entry.getValue();
if (space.getMax() == 0) {
- // The CMS collector sometimes passes us nonsense stats.
+ // The collector sometimes passes us nonsense stats.
continue;
}
long percentUsed = 100 * space.getUsed() / space.getMax();
- if (percentUsed > occupiedHeapPercentageThreshold) {
+ if (percentUsed > occupiedHeapPercentageThreshold.getAsInt()) {
if (info.getGcCause().equals("System.gc()") && !throwingOom.getAndSet(true)) {
// Assume we got here from a GC initiated by the other branch.
String exitMsg =
@@ -122,20 +149,16 @@
space.getMax(),
occupiedHeapPercentageThreshold);
System.err.println(exitMsg);
- logger.info(exitMsg);
+ logger.atInfo().log(exitMsg);
// Exits the runtime.
BugReport.handleCrash(new OutOfMemoryError(exitMsg));
- } else if (System.currentTimeMillis() - lastTriggeredGcInMilliseconds
+ } else if (System.currentTimeMillis() - lastTriggeredGcInMilliseconds.get()
> MIN_TIME_BETWEEN_TRIGGERED_GC_MILLISECONDS) {
- logger.info(
- "Triggering a full GC with "
- + space.getUsed()
- + " out of "
- + space.getMax()
- + " used");
+ logger.atInfo().log(
+ "Triggering a full GC with %s out of %s used", space.getUsed(), space.getMax());
// Force a full stop-the-world GC and see if it can get us below the threshold.
System.gc();
- lastTriggeredGcInMilliseconds = System.currentTimeMillis();
+ lastTriggeredGcInMilliseconds.set(System.currentTimeMillis());
}
}
}
diff --git a/src/test/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiterTest.java b/src/test/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiterTest.java
new file mode 100644
index 0000000..a91447d
--- /dev/null
+++ b/src/test/java/com/google/devtools/build/lib/runtime/RetainedHeapLimiterTest.java
@@ -0,0 +1,94 @@
+// Copyright 2019 The Bazel Authors. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package com.google.devtools.build.lib.runtime;
+
+import static com.google.common.truth.Truth.assertThat;
+import static org.mockito.Mockito.never;
+import static org.mockito.Mockito.times;
+import static org.mockito.Mockito.withSettings;
+
+import com.google.common.collect.ImmutableList;
+import com.google.devtools.build.lib.util.AbruptExitException;
+import java.lang.management.GarbageCollectorMXBean;
+import javax.management.ListenerNotFoundException;
+import javax.management.NotificationEmitter;
+import org.junit.Test;
+import org.junit.runner.RunWith;
+import org.junit.runners.JUnit4;
+import org.mockito.Mockito;
+
+/**
+ * Basic tests for {@link RetainedHeapLimiter}. More realistic tests are hard because {@link
+ * RetainedHeapLimiter} intentionally crashes the JVM.
+ */
+@RunWith(JUnit4.class)
+public class RetainedHeapLimiterTest {
+ @Test
+ public void findBeans() {
+ GarbageCollectorMXBean mockUselessBean = Mockito.mock(GarbageCollectorMXBean.class);
+ String[] untenuredPoolNames = {"assistant", "adjunct"};
+ Mockito.when(mockUselessBean.getMemoryPoolNames()).thenReturn(untenuredPoolNames);
+ GarbageCollectorMXBean mockBean =
+ Mockito.mock(
+ GarbageCollectorMXBean.class,
+ withSettings().extraInterfaces(NotificationEmitter.class));
+ String[] poolNames = {"not tenured", "CMS Old Gen"};
+ Mockito.when(mockBean.getMemoryPoolNames()).thenReturn(poolNames);
+ assertThat(
+ RetainedHeapLimiter.findTenuredCollectorBeans(
+ ImmutableList.of(mockUselessBean, mockBean)))
+ .containsExactly(mockBean);
+ }
+
+ @Test
+ public void smoke() throws AbruptExitException, ListenerNotFoundException {
+ GarbageCollectorMXBean mockUselessBean = Mockito.mock(GarbageCollectorMXBean.class);
+ String[] untenuredPoolNames = {"assistant", "adjunct"};
+ Mockito.when(mockUselessBean.getMemoryPoolNames()).thenReturn(untenuredPoolNames);
+ GarbageCollectorMXBean mockBean =
+ Mockito.mock(
+ GarbageCollectorMXBean.class,
+ withSettings().extraInterfaces(NotificationEmitter.class));
+ String[] poolNames = {"not tenured", "CMS Old Gen"};
+ Mockito.when(mockBean.getMemoryPoolNames()).thenReturn(poolNames);
+
+ RetainedHeapLimiter underTest =
+ new RetainedHeapLimiter(ImmutableList.of(mockUselessBean, mockBean));
+ underTest.updateThreshold(100);
+ Mockito.verify((NotificationEmitter) mockBean, never())
+ .addNotificationListener(underTest, null, null);
+ Mockito.verify((NotificationEmitter) mockBean, never())
+ .removeNotificationListener(underTest, null, null);
+
+ underTest.updateThreshold(90);
+ Mockito.verify((NotificationEmitter) mockBean, times(1))
+ .addNotificationListener(underTest, null, null);
+ Mockito.verify((NotificationEmitter) mockBean, never())
+ .removeNotificationListener(underTest, null, null);
+
+ underTest.updateThreshold(80);
+ // No additional calls.
+ Mockito.verify((NotificationEmitter) mockBean, times(1))
+ .addNotificationListener(underTest, null, null);
+ Mockito.verify((NotificationEmitter) mockBean, never())
+ .removeNotificationListener(underTest, null, null);
+
+ underTest.updateThreshold(100);
+ Mockito.verify((NotificationEmitter) mockBean, times(1))
+ .addNotificationListener(underTest, null, null);
+ Mockito.verify((NotificationEmitter) mockBean, times(1))
+ .removeNotificationListener(underTest, null, null);
+ }
+}