blob: 42186aaf023aa101fd91512a85d0448f7810a079 [file] [log] [blame]
// Copyright 2022 The Bazel Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package com.google.devtools.build.lib.worker;
import static com.google.common.collect.ImmutableList.toImmutableList;
import com.google.common.annotations.VisibleForTesting;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.devtools.build.lib.buildeventstream.BuildEventStreamProtos.BuildMetrics.WorkerMetrics;
import com.google.devtools.build.lib.clock.Clock;
import com.google.devtools.build.lib.metrics.PsInfoCollector;
import com.google.devtools.build.lib.util.OS;
import com.google.devtools.build.lib.worker.WorkerMetric.WorkerStat;
import java.time.Instant;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;
/** Collects and populates system metrics about persistent workers. */
public class WorkerMetricsCollector {
/** The metrics collector (a static singleton instance). Inactive by default. */
private static final WorkerMetricsCollector instance = new WorkerMetricsCollector();
private Clock clock;
/**
* Mapping of worker process ids to their properties. One process could be mapped to multiple
* workers because of multiplex workers.
*/
private final Map<Long, WorkerMetric.WorkerProperties> processIdToWorkerProperties =
new ConcurrentHashMap<>();
private final Map<Long, Instant> workerLastCallTime = new ConcurrentHashMap<>();
private WorkerMetricsCollector() {}
public static WorkerMetricsCollector instance() {
return instance;
}
public void setClock(Clock clock) {
this.clock = clock;
}
/**
* Collects memory usage of all ancestors of processes by pid. If a pid does not allow collecting
* memory usage, it is silently ignored.
*/
PsInfoCollector.ResourceSnapshot collectMemoryUsageByPid(OS os, ImmutableSet<Long> processIds) {
// TODO(b/181317827): Support Windows.
if (processIds.isEmpty() || (os != OS.LINUX && os != OS.DARWIN)) {
return PsInfoCollector.ResourceSnapshot.create(
/* pidToMemoryInKb= */ ImmutableMap.of(), /* collectionTime= */ Instant.now());
}
return PsInfoCollector.instance().collectResourceUsage(processIds);
}
public ImmutableList<WorkerMetric> collectMetrics() {
PsInfoCollector.ResourceSnapshot resourceSnapshot =
collectMemoryUsageByPid(
OS.getCurrent(), ImmutableSet.copyOf(processIdToWorkerProperties.keySet()));
return buildWorkerMetrics(resourceSnapshot);
}
private ImmutableList<WorkerMetric> buildWorkerMetrics(
PsInfoCollector.ResourceSnapshot resourceSnapshot) {
ImmutableMap<Long, Integer> pidToMemoryInKb = resourceSnapshot.getPidToMemoryInKb();
Instant collectionTime = resourceSnapshot.getCollectionTime();
ImmutableList.Builder<WorkerMetric> workerMetrics = new ImmutableList.Builder<>();
List<Long> nonMeasurableProcessIds = new ArrayList<>();
for (WorkerMetric.WorkerProperties workerProperties : processIdToWorkerProperties.values()) {
Long pid = workerProperties.getProcessId();
WorkerStat workerStats =
WorkerStat.create(
pidToMemoryInKb.getOrDefault(pid, 0), workerLastCallTime.get(pid), collectionTime);
workerMetrics.add(
WorkerMetric.create(
workerProperties, workerStats, /* isMeasurable= */ pidToMemoryInKb.containsKey(pid)));
if (!pidToMemoryInKb.containsKey(pid)) {
nonMeasurableProcessIds.add(pid);
}
}
processIdToWorkerProperties.keySet().removeAll(nonMeasurableProcessIds);
return workerMetrics.build();
}
public ImmutableList<WorkerMetrics> createWorkerMetricsProto() {
return collectMetrics().stream().map(WorkerMetric::toProto).collect(toImmutableList());
}
public void clear() {
processIdToWorkerProperties.clear();
workerLastCallTime.clear();
}
@VisibleForTesting
Map<Long, WorkerMetric.WorkerProperties> getProcessIdToWorkerProperties() {
return processIdToWorkerProperties;
}
@VisibleForTesting
Map<Long, Instant> getWorkerLastCallTime() {
return workerLastCallTime;
}
/**
* Initializes workerIdToWorkerProperties for workers. If worker metrics already exists for this
* worker, only updates workerLastCallTime.
*/
public synchronized void registerWorker(
int workerId,
long processId,
String mnemonic,
boolean isMultiplex,
boolean isSandboxed,
int workerKeyHash) {
WorkerMetric.WorkerProperties existingWorkerProperties =
processIdToWorkerProperties.get(processId);
workerLastCallTime.put(processId, Instant.ofEpochMilli(clock.currentTimeMillis()));
if (existingWorkerProperties == null) {
processIdToWorkerProperties.put(
processId,
WorkerMetric.WorkerProperties.create(
ImmutableList.of(workerId),
processId,
mnemonic,
isMultiplex,
isSandboxed,
workerKeyHash));
return;
}
if (existingWorkerProperties.getWorkerIds().contains(workerId)) {
return;
}
ImmutableList<Integer> updatedWorkerIds =
ImmutableList.<Integer>builder()
.addAll(existingWorkerProperties.getWorkerIds())
.add(workerId)
.build();
WorkerMetric.WorkerProperties updatedWorkerProperties =
WorkerMetric.WorkerProperties.create(
updatedWorkerIds, processId, mnemonic, isMultiplex, isSandboxed, workerKeyHash);
processIdToWorkerProperties.put(processId, updatedWorkerProperties);
}
// TODO(b/238416583) Add deregister function
}