| // Copyright 2017 The Bazel Authors. All rights reserved. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| package com.google.devtools.build.lib.remote; |
| |
| import com.google.common.annotations.VisibleForTesting; |
| import com.google.common.base.Throwables; |
| import com.google.common.collect.ImmutableMap; |
| import com.google.devtools.build.lib.actions.ActionInput; |
| import com.google.devtools.build.lib.actions.ActionInputFileCache; |
| import com.google.devtools.build.lib.actions.EnvironmentalExecException; |
| import com.google.devtools.build.lib.actions.ExecException; |
| import com.google.devtools.build.lib.actions.Spawn; |
| import com.google.devtools.build.lib.actions.SpawnResult; |
| import com.google.devtools.build.lib.actions.SpawnResult.Status; |
| import com.google.devtools.build.lib.actions.Spawns; |
| import com.google.devtools.build.lib.actions.cache.VirtualActionInput; |
| import com.google.devtools.build.lib.analysis.platform.PlatformInfo; |
| import com.google.devtools.build.lib.cmdline.Label; |
| import com.google.devtools.build.lib.concurrent.ThreadSafety.ThreadSafe; |
| import com.google.devtools.build.lib.events.Event; |
| import com.google.devtools.build.lib.events.Reporter; |
| import com.google.devtools.build.lib.exec.SpawnExecException; |
| import com.google.devtools.build.lib.exec.SpawnRunner; |
| import com.google.devtools.build.lib.remote.DigestUtil.ActionKey; |
| import com.google.devtools.build.lib.remote.Retrier.RetryException; |
| import com.google.devtools.build.lib.remote.TreeNodeRepository.TreeNode; |
| import com.google.devtools.build.lib.util.ExitCode; |
| import com.google.devtools.build.lib.util.io.FileOutErr; |
| import com.google.devtools.build.lib.vfs.Path; |
| import com.google.devtools.build.lib.vfs.PathFragment; |
| import com.google.devtools.remoteexecution.v1test.Action; |
| import com.google.devtools.remoteexecution.v1test.ActionResult; |
| import com.google.devtools.remoteexecution.v1test.Command; |
| import com.google.devtools.remoteexecution.v1test.Digest; |
| import com.google.devtools.remoteexecution.v1test.ExecuteRequest; |
| import com.google.devtools.remoteexecution.v1test.ExecuteResponse; |
| import com.google.devtools.remoteexecution.v1test.Platform; |
| import com.google.protobuf.TextFormat; |
| import com.google.protobuf.TextFormat.ParseException; |
| import io.grpc.Context; |
| import io.grpc.Status.Code; |
| import java.io.IOException; |
| import java.io.OutputStream; |
| import java.nio.charset.StandardCharsets; |
| import java.time.Duration; |
| import java.util.ArrayList; |
| import java.util.Collection; |
| import java.util.Collections; |
| import java.util.HashMap; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.SortedMap; |
| import java.util.TreeSet; |
| import java.util.concurrent.atomic.AtomicBoolean; |
| import javax.annotation.Nullable; |
| |
| /** A client for the remote execution service. */ |
| @ThreadSafe |
| class RemoteSpawnRunner implements SpawnRunner { |
| private static final int POSIX_TIMEOUT_EXIT_CODE = /*SIGNAL_BASE=*/128 + /*SIGALRM=*/14; |
| |
| private final Path execRoot; |
| private final RemoteOptions options; |
| private final SpawnRunner fallbackRunner; |
| private final boolean verboseFailures; |
| |
| @Nullable private final Reporter cmdlineReporter; |
| @Nullable private final AbstractRemoteActionCache remoteCache; |
| @Nullable private final GrpcRemoteExecutor remoteExecutor; |
| private final String buildRequestId; |
| private final String commandId; |
| private final DigestUtil digestUtil; |
| |
| // Used to ensure that a warning is reported only once. |
| private final AtomicBoolean warningReported = new AtomicBoolean(); |
| |
/**
 * Creates a runner that stores the given collaborators and settings as-is.
 *
 * <p>{@code cmdlineReporter}, {@code remoteCache} and {@code remoteExecutor} may be null.
 */
RemoteSpawnRunner(
    Path execRoot,
    RemoteOptions options,
    SpawnRunner fallbackRunner,
    boolean verboseFailures,
    @Nullable Reporter cmdlineReporter,
    String buildRequestId,
    String commandId,
    @Nullable AbstractRemoteActionCache remoteCache,
    @Nullable GrpcRemoteExecutor remoteExecutor,
    DigestUtil digestUtil) {
  // Plain field initialization, listed in parameter order.
  this.execRoot = execRoot;
  this.options = options;
  this.fallbackRunner = fallbackRunner;
  this.verboseFailures = verboseFailures;
  this.cmdlineReporter = cmdlineReporter;
  this.buildRequestId = buildRequestId;
  this.commandId = commandId;
  this.remoteCache = remoteCache;
  this.remoteExecutor = remoteExecutor;
  this.digestUtil = digestUtil;
}
| |
| @Override |
| public SpawnResult exec(Spawn spawn, SpawnExecutionPolicy policy) |
| throws ExecException, InterruptedException, IOException { |
| if (!Spawns.mayBeExecutedRemotely(spawn) || remoteCache == null) { |
| return fallbackRunner.exec(spawn, policy); |
| } |
| |
| policy.report(ProgressStatus.EXECUTING, "remote"); |
| // Temporary hack: the TreeNodeRepository should be created and maintained upstream! |
| ActionInputFileCache inputFileCache = policy.getActionInputFileCache(); |
| TreeNodeRepository repository = new TreeNodeRepository(execRoot, inputFileCache, digestUtil); |
| SortedMap<PathFragment, ActionInput> inputMap = policy.getInputMapping(); |
| TreeNode inputRoot = repository.buildFromActionInputs(inputMap); |
| repository.computeMerkleDigests(inputRoot); |
| Command command = buildCommand(spawn.getArguments(), spawn.getEnvironment()); |
| Action action = |
| buildAction( |
| execRoot, |
| spawn.getOutputFiles(), |
| digestUtil.compute(command), |
| repository.getMerkleDigest(inputRoot), |
| spawn.getExecutionPlatform(), |
| policy.getTimeout(), |
| Spawns.mayBeCached(spawn)); |
| |
| // Look up action cache, and reuse the action output if it is found. |
| ActionKey actionKey = digestUtil.computeActionKey(action); |
| Context withMetadata = |
| TracingMetadataUtils.contextWithMetadata(buildRequestId, commandId, actionKey); |
| Context previous = withMetadata.attach(); |
| try { |
| boolean acceptCachedResult = options.remoteAcceptCached && Spawns.mayBeCached(spawn); |
| boolean uploadLocalResults = options.remoteUploadLocalResults; |
| |
| try { |
| // Try to lookup the action in the action cache. |
| ActionResult cachedResult = |
| acceptCachedResult ? remoteCache.getCachedActionResult(actionKey) : null; |
| if (cachedResult != null) { |
| if (cachedResult.getExitCode() != 0) { |
| // The remote cache must never serve a failed action. |
| throw new EnvironmentalExecException( |
| "The remote cache is in an invalid state as it" |
| + " served a failed action. Hash of the action: " |
| + actionKey.getDigest()); |
| } |
| try { |
| return downloadRemoteResults(cachedResult, policy.getFileOutErr()) |
| .setCacheHit(true) |
| .build(); |
| } catch (CacheNotFoundException e) { |
| // No cache hit, so we fall through to local or remote execution. |
| // We set acceptCachedResult to false in order to force the action re-execution. |
| acceptCachedResult = false; |
| } |
| } |
| } catch (IOException e) { |
| return execLocallyOrFail(spawn, policy, inputMap, actionKey, uploadLocalResults, e); |
| } |
| |
| if (remoteExecutor == null) { |
| // Remote execution is disabled and so execute the spawn on the local machine. |
| return execLocally(spawn, policy, inputMap, uploadLocalResults, remoteCache, actionKey); |
| } |
| |
| try { |
| // Upload the command and all the inputs into the remote cache. |
| remoteCache.ensureInputsPresent(repository, execRoot, inputRoot, command); |
| } catch (IOException e) { |
| return execLocallyOrFail(spawn, policy, inputMap, actionKey, uploadLocalResults, e); |
| } |
| |
| final ActionResult result; |
| try { |
| ExecuteRequest.Builder request = |
| ExecuteRequest.newBuilder() |
| .setInstanceName(options.remoteInstanceName) |
| .setAction(action) |
| .setSkipCacheLookup(!acceptCachedResult); |
| ExecuteResponse reply = remoteExecutor.executeRemotely(request.build()); |
| result = reply.getResult(); |
| } catch (IOException e) { |
| return execLocallyOrFail(spawn, policy, inputMap, actionKey, uploadLocalResults, e); |
| } |
| |
| try { |
| return downloadRemoteResults(result, policy.getFileOutErr()).build(); |
| } catch (IOException e) { |
| return execLocallyOrFail(spawn, policy, inputMap, actionKey, uploadLocalResults, e); |
| } |
| } finally { |
| withMetadata.detach(previous); |
| } |
| } |
| |
| private SpawnResult.Builder downloadRemoteResults(ActionResult result, FileOutErr outErr) |
| throws ExecException, IOException, InterruptedException { |
| remoteCache.download(result, execRoot, outErr); |
| int exitCode = result.getExitCode(); |
| return new SpawnResult.Builder() |
| .setStatus(exitCode == 0 ? Status.SUCCESS : Status.NON_ZERO_EXIT) |
| .setExitCode(exitCode); |
| } |
| |
| private SpawnResult execLocallyOrFail( |
| Spawn spawn, |
| SpawnExecutionPolicy policy, |
| SortedMap<PathFragment, ActionInput> inputMap, |
| ActionKey actionKey, |
| boolean uploadLocalResults, |
| IOException cause) |
| throws ExecException, InterruptedException, IOException { |
| if (options.remoteLocalFallback && !(cause instanceof TimeoutException)) { |
| return execLocally(spawn, policy, inputMap, uploadLocalResults, remoteCache, actionKey); |
| } |
| return handleError(cause, policy.getFileOutErr()); |
| } |
| |
| private SpawnResult handleError(IOException exception, FileOutErr outErr) throws IOException, |
| ExecException { |
| final Throwable cause = exception.getCause(); |
| if (exception instanceof TimeoutException || cause instanceof TimeoutException) { |
| // TODO(buchgr): provide stdout/stderr from the action that timed out. |
| // Remove the unsuported message once remote execution tests no longer check for it. |
| try (OutputStream out = outErr.getOutputStream()) { |
| String msg = "Log output for timeouts is not yet supported in remote execution.\n"; |
| out.write(msg.getBytes(StandardCharsets.UTF_8)); |
| } |
| return new SpawnResult.Builder() |
| .setStatus(Status.TIMEOUT) |
| .setExitCode(POSIX_TIMEOUT_EXIT_CODE) |
| .build(); |
| } |
| final Status status; |
| if (exception instanceof RetryException |
| && RemoteRetrierUtils.causedByStatus((RetryException) exception, Code.UNAVAILABLE)) { |
| status = Status.EXECUTION_FAILED_CATASTROPHICALLY; |
| } else if (exception instanceof CacheNotFoundException |
| || cause instanceof CacheNotFoundException) { |
| status = Status.REMOTE_CACHE_FAILED; |
| } else { |
| status = Status.EXECUTION_FAILED; |
| } |
| throw new SpawnExecException( |
| Throwables.getStackTraceAsString(exception), |
| new SpawnResult.Builder() |
| .setStatus(status) |
| .setExitCode(ExitCode.REMOTE_ERROR.getNumericExitCode()) |
| .build(), |
| /* forciblyRunRemotely= */ false); |
| } |
| |
| static Action buildAction( |
| Path execRoot, |
| Collection<? extends ActionInput> outputs, |
| Digest command, |
| Digest inputRoot, |
| @Nullable PlatformInfo executionPlatform, |
| Duration timeout, |
| boolean cacheable) { |
| |
| Action.Builder action = Action.newBuilder(); |
| action.setCommandDigest(command); |
| action.setInputRootDigest(inputRoot); |
| ArrayList<String> outputPaths = new ArrayList<>(); |
| ArrayList<String> outputDirectoryPaths = new ArrayList<>(); |
| for (ActionInput output : outputs) { |
| String pathString = output.getExecPathString(); |
| if (execRoot.getRelative(pathString).isDirectory()) { |
| outputDirectoryPaths.add(pathString); |
| } else { |
| outputPaths.add(pathString); |
| } |
| } |
| Collections.sort(outputPaths); |
| Collections.sort(outputDirectoryPaths); |
| action.addAllOutputFiles(outputPaths); |
| action.addAllOutputDirectories(outputDirectoryPaths); |
| |
| // Get the remote platform properties. |
| if (executionPlatform != null) { |
| Platform platform = |
| parsePlatform(executionPlatform.label(), executionPlatform.remoteExecutionProperties()); |
| action.setPlatform(platform); |
| } |
| |
| if (!timeout.isZero()) { |
| action.setTimeout(com.google.protobuf.Duration.newBuilder().setSeconds(timeout.getSeconds())); |
| } |
| if (!cacheable) { |
| action.setDoNotCache(true); |
| } |
| return action.build(); |
| } |
| |
| static Platform parsePlatform(Label platformLabel, @Nullable String platformDescription) { |
| Platform.Builder platformBuilder = Platform.newBuilder(); |
| try { |
| if (platformDescription != null) { |
| TextFormat.getParser().merge(platformDescription, platformBuilder); |
| } |
| } catch (ParseException e) { |
| throw new IllegalArgumentException( |
| String.format( |
| "Failed to parse remote_execution_properties from platform %s", platformLabel), |
| e); |
| } |
| return platformBuilder.build(); |
| } |
| |
| static Command buildCommand(List<String> arguments, ImmutableMap<String, String> env) { |
| Command.Builder command = Command.newBuilder(); |
| command.addAllArguments(arguments); |
| // Sorting the environment pairs by variable name. |
| TreeSet<String> variables = new TreeSet<>(env.keySet()); |
| for (String var : variables) { |
| command.addEnvironmentVariablesBuilder().setName(var).setValue(env.get(var)); |
| } |
| return command.build(); |
| } |
| |
| private Map<Path, Long> getInputCtimes(SortedMap<PathFragment, ActionInput> inputMap) { |
| HashMap<Path, Long> ctimes = new HashMap<>(); |
| for (Map.Entry<PathFragment, ActionInput> e : inputMap.entrySet()) { |
| ActionInput input = e.getValue(); |
| if (input instanceof VirtualActionInput) { |
| continue; |
| } |
| Path path = execRoot.getRelative(input.getExecPathString()); |
| try { |
| ctimes.put(path, path.stat().getLastChangeTime()); |
| } catch (IOException ex) { |
| // Put a token value indicating an exception; this is used so that if the exception |
| // is raised both before and after the execution, it is ignored, but if it is raised only |
| // one of the times, it triggers a remote cache upload skip. |
| ctimes.put(path, -1L); |
| } |
| } |
| return ctimes; |
| } |
| |
| /** |
| * Execute a {@link Spawn} locally, using {@link #fallbackRunner}. |
| * |
| * <p>If possible also upload the {@link SpawnResult} to a remote cache. |
| */ |
| private SpawnResult execLocally( |
| Spawn spawn, |
| SpawnExecutionPolicy policy, |
| SortedMap<PathFragment, ActionInput> inputMap, |
| boolean uploadToCache, |
| @Nullable AbstractRemoteActionCache remoteCache, |
| @Nullable ActionKey actionKey) |
| throws ExecException, IOException, InterruptedException { |
| if (uploadToCache && remoteCache != null && actionKey != null) { |
| return execLocallyAndUpload(spawn, policy, inputMap, remoteCache, actionKey); |
| } |
| return fallbackRunner.exec(spawn, policy); |
| } |
| |
| @VisibleForTesting |
| SpawnResult execLocallyAndUpload( |
| Spawn spawn, |
| SpawnExecutionPolicy policy, |
| SortedMap<PathFragment, ActionInput> inputMap, |
| AbstractRemoteActionCache remoteCache, |
| ActionKey actionKey) |
| throws ExecException, IOException, InterruptedException { |
| Map<Path, Long> ctimesBefore = getInputCtimes(inputMap); |
| SpawnResult result = fallbackRunner.exec(spawn, policy); |
| Map<Path, Long> ctimesAfter = getInputCtimes(inputMap); |
| for (Map.Entry<Path, Long> e : ctimesBefore.entrySet()) { |
| // Skip uploading to remote cache, because an input was modified during execution. |
| if (!ctimesAfter.get(e.getKey()).equals(e.getValue())) { |
| return result; |
| } |
| } |
| List<Path> outputFiles = listExistingOutputFiles(execRoot, spawn); |
| try { |
| boolean uploadAction = |
| Spawns.mayBeCached(spawn) |
| && Status.SUCCESS.equals(result.status()) |
| && result.exitCode() == 0; |
| remoteCache.upload(actionKey, execRoot, outputFiles, policy.getFileOutErr(), uploadAction); |
| } catch (IOException e) { |
| if (verboseFailures) { |
| report(Event.debug("Upload to remote cache failed: " + e.getMessage())); |
| } else { |
| reportOnce(Event.warn("Some artifacts failed be uploaded to the remote cache.")); |
| } |
| } |
| return result; |
| } |
| |
| private void reportOnce(Event evt) { |
| if (warningReported.compareAndSet(false, true)) { |
| report(evt); |
| } |
| } |
| |
| private void report(Event evt) { |
| if (cmdlineReporter != null) { |
| cmdlineReporter.handle(evt); |
| } |
| } |
| |
| static List<Path> listExistingOutputFiles(Path execRoot, Spawn spawn) { |
| ArrayList<Path> outputFiles = new ArrayList<>(); |
| for (ActionInput output : spawn.getOutputFiles()) { |
| Path outputPath = execRoot.getRelative(output.getExecPathString()); |
| // TODO(ulfjack): Store the actual list of output files in SpawnResult and use that instead |
| // of statting the files here again. |
| if (outputPath.exists()) { |
| outputFiles.add(outputPath); |
| } |
| } |
| return outputFiles; |
| } |
| } |