SimpleBloomFilter.java
- /*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- package org.apache.commons.collections4.bloomfilter;
- import java.util.Arrays;
- import java.util.Objects;
- import java.util.function.IntPredicate;
- import java.util.function.LongPredicate;
- /**
- * A bloom filter using an array of bit maps to track enabled bits. This is a standard implementation and should work well for most Bloom filters.
- *
- * @since 4.5.0-M1
- */
- public final class SimpleBloomFilter implements BloomFilter<SimpleBloomFilter> {
- /**
- * The array of bit map longs that defines this Bloom filter. Will be null if the filter is empty.
- */
- private final long[] bitMap;
- /**
- * The Shape of this Bloom filter.
- */
- private final Shape shape;
- /**
- * The cardinality of this Bloom filter.
- */
- private int cardinality;
- /**
- * Creates an empty instance.
- *
- * @param shape The shape for the filter.
- */
- public SimpleBloomFilter(final Shape shape) {
- Objects.requireNonNull(shape, "shape");
- this.shape = shape;
- this.bitMap = BitMaps.newBitMap(shape);
- this.cardinality = 0;
- }
- /**
- * Copy constructor for {@code copy()} use.
- *
- * @param source
- */
- private SimpleBloomFilter(final SimpleBloomFilter source) {
- this.shape = source.shape;
- this.bitMap = source.bitMap.clone();
- this.cardinality = source.cardinality;
- }
- @Override
- public long[] asBitMapArray() {
- return Arrays.copyOf(bitMap, bitMap.length);
- }
- @Override
- public int cardinality() {
- // Lazy evaluation with caching
- int c = cardinality;
- if (c < 0) {
- cardinality = c = SetOperations.cardinality(this);
- }
- return c;
- }
- @Override
- public int characteristics() {
- return 0;
- }
- @Override
- public void clear() {
- Arrays.fill(bitMap, 0L);
- cardinality = 0;
- }
- @Override
- public boolean contains(final IndexExtractor indexExtractor) {
- return indexExtractor.processIndices(idx -> BitMaps.contains(bitMap, idx));
- }
- /**
- * Creates a new instance of this {@link SimpleBloomFilter} with the same properties as the current one.
- *
- * @return a copy of this {@link SimpleBloomFilter}.
- */
- @Override
- public SimpleBloomFilter copy() {
- return new SimpleBloomFilter(this);
- }
- @Override
- public Shape getShape() {
- return shape;
- }
- @Override
- public boolean isEmpty() {
- return cardinality == 0 || processBitMaps(y -> y == 0);
- }
- @Override
- public boolean merge(final BitMapExtractor bitMapExtractor) {
- Objects.requireNonNull(bitMapExtractor, "bitMapExtractor");
- try {
- final int[] idx = new int[1];
- bitMapExtractor.processBitMaps(value -> {
- bitMap[idx[0]++] |= value;
- return true;
- });
- // idx[0] will be limit+1 so decrement it
- idx[0]--;
- final int idxLimit = BitMaps.getLongIndex(shape.getNumberOfBits());
- if (idxLimit == idx[0]) {
- final long excess = bitMap[idxLimit] >> shape.getNumberOfBits();
- if (excess != 0) {
- throw new IllegalArgumentException(
- String.format("BitMapExtractor set a bit higher than the limit for the shape: %s", shape.getNumberOfBits()));
- }
- }
- cardinality = -1;
- } catch (final IndexOutOfBoundsException e) {
- throw new IllegalArgumentException(String.format("BitMapExtractor should send at most %s maps", bitMap.length), e);
- }
- return true;
- }
- @Override
- public boolean merge(final BloomFilter<?> other) {
- Objects.requireNonNull(other, "other");
- if ((other.characteristics() & SPARSE) != 0) {
- merge((IndexExtractor) other);
- } else {
- merge((BitMapExtractor) other);
- }
- return true;
- }
- @Override
- public boolean merge(final Hasher hasher) {
- Objects.requireNonNull(hasher, "hasher");
- return merge(hasher.indices(shape));
- }
- @Override
- public boolean merge(final IndexExtractor indexExtractor) {
- Objects.requireNonNull(indexExtractor, "indexExtractor");
- indexExtractor.processIndices(idx -> {
- if (idx < 0 || idx >= shape.getNumberOfBits()) {
- throw new IllegalArgumentException(String.format("IndexExtractor should only send values in the range[0,%s)", shape.getNumberOfBits()));
- }
- BitMaps.set(bitMap, idx);
- return true;
- });
- cardinality = -1;
- return true;
- }
- @Override
- public boolean processBitMapPairs(final BitMapExtractor other, final LongBiPredicate func) {
- final CountingLongPredicate p = new CountingLongPredicate(bitMap, func);
- return other.processBitMaps(p) && p.processRemaining();
- }
- @Override
- public boolean processBitMaps(final LongPredicate consumer) {
- Objects.requireNonNull(consumer, "consumer");
- for (final long l : bitMap) {
- if (!consumer.test(l)) {
- return false;
- }
- }
- return true;
- }
- @Override
- public boolean processIndices(final IntPredicate consumer) {
- Objects.requireNonNull(consumer, "consumer");
- return IndexExtractor.fromBitMapExtractor(this).processIndices(consumer);
- }
- }