blob: b54b48575f13176c2b20f266d4f3f5c1d0b5a77e [file] [log] [blame]
// Copyright 2018 The Bazel Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package com.google.devtools.build.lib.collect;
import com.google.common.base.Preconditions;
import com.google.common.collect.ImmutableList;
import java.util.Comparator;
import java.util.PriorityQueue;
/**
* A streaming aggregator that, given a {@code k}, allows a streaming aggregation of {@code n}
* elements into the {@code min(k, n)} most extreme, in {@code O(min(k, n))} memory and {@code O(n *
* log(min(k, n)))} time.
*/
public abstract class Extrema<T> {
private static final Extrema<Object> EMPTY = new EmptyExtrema<>();
/**
* Creates an {@link Extrema} that can aggregate {@code n} elements into the {@code min(k, n)}
* smallest.
*/
public static <T extends Comparable<T>> Extrema<T> min(int k) {
return min(k, Comparator.<T>naturalOrder());
}
/**
* Creates an {@link Extrema} that can aggregate {@code n} elements into the {@code min(k, n)}
* smallest, per the given {@code comparator}.
*/
public static <T> Extrema<T> min(int k, Comparator<T> comparator) {
return create(k, comparator);
}
/**
* Creates an {@link Extrema} that can aggregate {@code n} elements into the {@code min(k, n)}
* largest.
*/
public static <T extends Comparable<T>> Extrema<T> max(int k) {
return max(k, Comparator.<T>naturalOrder());
}
/**
* Creates an {@link Extrema} that can aggregate {@code n} elements into the {@code min(k, n)}
* largest, per the given {@code comparator}.
*/
public static <T> Extrema<T> max(int k, Comparator<T> comparator) {
return create(k, comparator.reversed());
}
/**
* Aggregates the given element.
*
* <p>See {@link #getExtremeElements()}.
*/
public abstract void aggregate(T element);
/**
* For an {@link Extrema} created with {@code k} and with {@code n} calls to {@link #aggregate}
* since the most recent call to {@link #clear}, returns the {@code min(k, n)} most extreme of the
* those elements, sorted from most extreme to least extreme.
*/
public abstract ImmutableList<T> getExtremeElements();
/** Returns true iff {@link #getExtremeElements()} would return an empty result. */
public abstract boolean isEmpty();
/**
* Disregards all the elements {@link #aggregate}'ed already.
*
* <p>See {@link #getExtremeElements()}.
*/
public abstract void clear();
@SuppressWarnings("unchecked")
private static <T> Extrema<T> create(int k, Comparator<T> comparator) {
Preconditions.checkArgument(k >= 0, "invalid k (%s), must be >=0", k);
return k == 0 ? (Extrema<T>) EMPTY : new RegularExtrema<>(k, comparator);
}
private static class EmptyExtrema<T> extends Extrema<T> {
@Override
public void aggregate(T element) {
// no-op.
}
@Override
public ImmutableList<T> getExtremeElements() {
return ImmutableList.of();
}
@Override
public void clear() {
// no-op.
}
@Override
public boolean isEmpty() {
return true;
}
}
private static class RegularExtrema<T> extends Extrema<T> {
private final int k;
private final Comparator<T> extremaComparator;
private final PriorityQueue<T> priorityQueue;
/**
* @param k the number of extreme elements to compute
* @param extremaComparator a comparator such that {@code extremaComparator(a, b) < 0} iff
* {@code a} is more extreme than {@code b}
*/
private RegularExtrema(int k, Comparator<T> extremaComparator) {
this.k = k;
this.extremaComparator = extremaComparator;
this.priorityQueue =
new PriorityQueue<>(
/*initialCapacity=*/ k,
// Our implementation strategy is to keep a priority queue of the k most extreme
// elements
// encountered, ordered backwards; this way we have constant-time access to the least
// extreme among these elements.
extremaComparator.reversed());
}
@Override
public void aggregate(T element) {
if (priorityQueue.size() < k) {
priorityQueue.add(element);
} else {
if (extremaComparator.compare(element, priorityQueue.peek()) < 0) {
// Suppose the least extreme of the current k most extreme elements is e. If the new
// element
// is more extreme than e, then (i) it must be among the new k most extreme among the (2)
// e
// must not be.
priorityQueue.remove();
priorityQueue.add(element);
}
}
}
@Override
public ImmutableList<T> getExtremeElements() {
return ImmutableList.sortedCopyOf(extremaComparator, priorityQueue);
}
@Override
public void clear() {
priorityQueue.clear();
}
@Override
public boolean isEmpty() {
return priorityQueue.isEmpty();
}
}
}