blob: 435a9a35abe05e5cb0ce85a8ae9ddd9f5a80bc73 [file] [log] [blame]
// Copyright 2014 The Bazel Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package com.google.devtools.build.lib.skyframe;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Preconditions;
import com.google.devtools.build.lib.actions.ActionExecutionStatusReporter;
import java.util.concurrent.atomic.AtomicBoolean;
/**
* An object that can monitor whether actions are getting completed in a timely manner.
*
* <p>If there's nothing happening for a while, a background thread will print (and update) the
* "Still waiting for N actions to complete..." message.
*/
public final class ActionExecutionInactivityWatchdog {
/** An object used in monitoring action execution inactivity. */
public interface InactivityMonitor {
/** Returns whether action execution has started. */
boolean hasStarted();
/** Returns the number of enqueued but not yet completed actions. */
int getPending();
/**
* Waits for any action to complete, or the timeout to elapse.
*
* <p>The thread must wait at least for the specified timeout, unless some action completes in
* the meantime. It's not allowed to return 0 too early.
*
* <p>Note that it's acceptable to return (any value) later than specified by the timeout.
*
* @return the number of actions completed during the wait
*/
int waitForNextCompletion(int timeoutSeconds) throws InterruptedException;
}
/** An object that the watchdog can report inactivity to. */
public interface InactivityReporter {
/**
* Report that actions are not getting completed in a timely manner.
*
* <p>Inactivity is typically not reported if tests with streaming output are being run.
*/
void maybeReportInactivity();
}
@VisibleForTesting
interface Sleep {
void sleep(int durationMilliseconds) throws InterruptedException;
}
private static final class WaitTime {
private final int progressIntervalFlagValue;
private int prev;
public WaitTime(int progressIntervalFlagValue) {
this.progressIntervalFlagValue = progressIntervalFlagValue;
}
public void reset() {
prev = 0;
}
public int next() {
prev = ActionExecutionStatusReporter.getWaitTime(progressIntervalFlagValue, prev);
return prev;
}
}
private final AtomicBoolean isRunning = new AtomicBoolean(false);
private final InactivityMonitor monitor;
private final InactivityReporter reporter;
private final Sleep sleeper;
private final Thread thread;
private final WaitTime waitTime;
public ActionExecutionInactivityWatchdog(InactivityMonitor monitor, InactivityReporter reporter,
int progressIntervalFlagValue) {
this(monitor, reporter, progressIntervalFlagValue, new Sleep() {
@Override
public void sleep(int durationMilliseconds) throws InterruptedException {
Thread.sleep(durationMilliseconds);
}
});
}
@VisibleForTesting
public ActionExecutionInactivityWatchdog(InactivityMonitor monitor, InactivityReporter reporter,
int progressIntervalFlagValue, Sleep sleeper) {
this.monitor = Preconditions.checkNotNull(monitor);
this.reporter = Preconditions.checkNotNull(reporter);
this.sleeper = Preconditions.checkNotNull(sleeper);
this.waitTime = new WaitTime(progressIntervalFlagValue);
this.thread = new Thread(() -> enterWatchdogLoop(), "action-execution-watchdog");
this.thread.setDaemon(true);
}
/** Starts the watchdog thread. This method should only be called once. */
public void start() {
Preconditions.checkState(!isRunning.getAndSet(true));
thread.start();
}
/**
* Stops the watchdog thread. This method should only be called once.
*
* <p>The method waits for the thread to terminate. If the caller thread is interrupted
* in the meantime, the interrupted status will be set.
*/
public void stop() {
Preconditions.checkState(isRunning.getAndSet(false));
thread.interrupt();
try {
thread.join();
} catch (InterruptedException e) {
// When Thread.join throws, the interrupted status is cleared. We need to set it again.
Thread.currentThread().interrupt();
}
}
private void enterWatchdogLoop() {
while (isRunning.get()) {
try {
// Wait a while for any SkyFunction to finish. The returned number indicates how many
// actions completed during the wait. It's possible that this is more than 1, since
// this thread may not immediately regain control.
int completedActions = monitor.waitForNextCompletion(waitTime.next());
if (!isRunning.get()) {
break;
}
int pending = monitor.getPending();
if (!monitor.hasStarted() || completedActions > 0 || pending == 0) {
// If no keys have been enqueued yet (execution hasn't started), or some actions
// were completed since this thread was notified (we are making visible progress),
// or there are currently no enqueued actions waiting to be processed (perhaps all
// have completed and we are about to stop monitoring), then there's no need to
// display any messages.
waitTime.reset();
// Sleep a while before checking again. Actions might be executing at a nice rate, no
// need to worry about inactivity. This extra sleep isn't required but it's nice to
// have: without it we would, at times of high action completion rate, unnecessarily
// put the monitor into a fast sleep-wake cycle --- not a big problem but wasteful.
sleeper.sleep(1000);
} else {
// If actions are executing but we haven't made any progress in a while (no new
// action completion), then reassure the user that we're still running. Next time
// wait a little longer.
reporter.maybeReportInactivity();
}
} catch (InterruptedException ie) {
Thread.currentThread().interrupt();
return;
}
}
}
}