/* * Copyright 2014-2017 Real Logic Ltd. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.agrona.collections; import org.agrona.BitUtil; import java.lang.reflect.Array; import java.util.*; import java.util.function.IntConsumer; import java.util.function.Predicate; import static org.agrona.collections.CollectionUtil.validateLoadFactor; /** * Open-addressing with linear-probing expandable hash set. Allocation free in steady state use when expanded. * Ability to be notified when resizing occurs so that appropriate sizing can be implemented. * * Not Threadsafe. * * This HashSet caches its iterator object, so nested iteration is not supported. * * @see ObjectIterator * @see Set * @param <T> type of values stored in the {@link java.util.Set} */ public final class ObjectHashSet<T> extends AbstractSet<T> { /** * The initial capacity used when none is specified in the constructor. */ public static final int DEFAULT_INITIAL_CAPACITY = 8; private static final Object MISSING_VALUE = null; private final float loadFactor; private int resizeThreshold; private int size; private T[] values; private final ObjectHashSetIterator iterator; private IntConsumer resizeNotifier; public ObjectHashSet() { this(DEFAULT_INITIAL_CAPACITY); } public ObjectHashSet(final int proposedCapacity) { this(proposedCapacity, Hashing.DEFAULT_LOAD_FACTOR); } @SuppressWarnings("unchecked") public ObjectHashSet(final int initialCapacity, final float loadFactor) { validateLoadFactor(loadFactor); this.loadFactor = loadFactor; size = 0; final int capacity = BitUtil.findNextPositivePowerOfTwo(initialCapacity); resizeThreshold = (int)(capacity * loadFactor); values = (T[])new Object[capacity]; Arrays.fill(values, MISSING_VALUE); // NB: references values in the constructor, so must be assigned after values iterator = new ObjectHashSetIterator(); } /** * Add a Consumer that will be called when the collection is resized. * * @param resizeNotifier IntConsumer containing the new resizeThreshold */ public void resizeNotifier(final IntConsumer resizeNotifier) { this.resizeNotifier = resizeNotifier; } /** * @param value the value to add * @return true if the collection has changed, false otherwise * @throws NullPointerException if the value is null */ public boolean add(final T value) { Objects.requireNonNull(value); final Object[] values = this.values; final int mask = values.length - 1; int index = value.hashCode() & mask; while (values[index] != MISSING_VALUE) { if (values[index].equals(value)) { return false; } index = next(index, mask); } values[index] = value; size++; if (size > resizeThreshold) { increaseCapacity(); if (resizeNotifier != null) { resizeNotifier.accept(resizeThreshold); } } return true; } private void increaseCapacity() { final int newCapacity = values.length * 2; if (newCapacity < 0) { throw new IllegalStateException("Max capacity reached at size=" + size); } rehash(newCapacity); } @SuppressWarnings("unchecked") private void rehash(final int newCapacity) { final int mask = newCapacity - 1; resizeThreshold = (int)(newCapacity * loadFactor); final T[] tempValues = (T[])new Object[newCapacity]; Arrays.fill(tempValues, MISSING_VALUE); for (final T value : values) { if (value != MISSING_VALUE) { int newHash = value.hashCode() & mask; while (tempValues[newHash] != MISSING_VALUE) { newHash = ++newHash & mask; } tempValues[newHash] = value; } } values = tempValues; } /** * @param value the value to remove * @return true if the value was present, false otherwise */ public boolean remove(final Object value) { final Object[] values = this.values; final int mask = values.length - 1; int index = value.hashCode() & mask; while (values[index] != MISSING_VALUE) { if (values[index].equals(value)) { values[index] = MISSING_VALUE; compactChain(index); size--; return true; } index = next(index, mask); } return false; } private static int next(final int index, final int mask) { return (index + 1) & mask; } @SuppressWarnings("FinalParameters") void compactChain(int deleteIndex) { final Object[] values = this.values; final int mask = values.length - 1; int index = deleteIndex; while (true) { index = next(index, mask); if (values[index] == MISSING_VALUE) { return; } final int hash = values[index].hashCode() & mask; if ((index < hash && (hash <= deleteIndex || deleteIndex <= index)) || (hash <= deleteIndex && deleteIndex <= index)) { values[deleteIndex] = values[index]; values[index] = MISSING_VALUE; deleteIndex = index; } } } /** * Compact the backing arrays by rehashing with a capacity just larger than current size * and giving consideration to the load factor. */ public void compact() { final int idealCapacity = (int)Math.round(size() * (1.0 / loadFactor)); rehash(BitUtil.findNextPositivePowerOfTwo(idealCapacity)); } /** * {@inheritDoc} */ public boolean contains(final Object value) { final Object[] values = this.values; final int mask = values.length - 1; int index = value.hashCode() & mask; while (values[index] != MISSING_VALUE) { if (values[index].equals(value)) { return true; } index = next(index, mask); } return false; } /** * {@inheritDoc} */ public int size() { return size; } /** * {@inheritDoc} */ public boolean isEmpty() { return size == 0; } /** * Get the load factor beyond which the set will increase size. * * @return load factor for when the set should increase size. */ public float loadFactor() { return loadFactor; } /** * Get the total capacity for the set to which the load factor with be a fraction of. * * @return the total capacity for the set. */ public int capacity() { return values.length; } /** * {@inheritDoc} */ public void clear() { Arrays.fill(values, MISSING_VALUE); size = 0; } /** * {@inheritDoc} */ public boolean containsAll(final Collection<?> coll) { for (final Object t : coll) { if (!contains(t)) { return false; } } return true; } /** * {@inheritDoc} */ public boolean addAll(final Collection<? extends T> coll) { return disjunction(coll, this::add); } /** * Alias for {@link #addAll(Collection)} for the specialized case when adding another ObjectHashSet, * avoids boxing and allocations * * @param coll containing the values to be added. * @return <tt>true</tt> if this set changed as a result of the call */ public boolean addAll(final ObjectHashSet<T> coll) { boolean acc = false; for (final T value : coll.values) { if (value != MISSING_VALUE) { acc |= add(value); } } return acc; } /** * Fast Path set difference for comparison with another ObjectHashSet. * * NB: garbage free in the identical case, allocates otherwise. * * @param other the other set to subtract * @return null if identical, otherwise the set of differences */ public ObjectHashSet<T> difference(final ObjectHashSet<T> other) { ObjectHashSet<T> difference = null; for (final T value : values) { if (value != MISSING_VALUE && !other.contains(value)) { if (difference == null) { difference = new ObjectHashSet<>(size); } difference.add(value); } } return difference; } /** * {@inheritDoc} */ public boolean removeAll(final Collection<?> coll) { return disjunction(coll, this::remove); } /** * Alias for {@link #removeAll(Collection)} for the specialized case when removing another ObjectHashSet, * avoids boxing and allocations * * @param coll containing the values to be removed. * @return <tt>true</tt> if this set changed as a result of the call */ public boolean removeAll(final ObjectHashSet<T> coll) { boolean acc = false; for (final T value : coll.values) { if (value != MISSING_VALUE) { acc |= remove(value); } } return acc; } private static <T> boolean disjunction(final Collection<T> coll, final Predicate<T> predicate) { boolean acc = false; for (final T t : coll) { // Deliberate strict evaluation acc |= predicate.test(t); } return acc; } /** * {@inheritDoc} */ public ObjectIterator<T> iterator() { iterator.reset(values, size); return iterator; } public void copy(final ObjectHashSet<T> that) { if (this.values.length != that.values.length) { throw new IllegalArgumentException("Cannot copy object: lengths not equal"); } System.arraycopy(that.values, 0, this.values, 0, this.values.length); this.size = that.size; } /** * {@inheritDoc} */ public String toString() { final StringBuilder sb = new StringBuilder(); sb.append('{'); for (final Object value : values) { if (value != MISSING_VALUE) { sb.append(value); sb.append(", "); } } if (sb.length() > 1) { sb.setLength(sb.length() - 2); } sb.append('}'); return sb.toString(); } /** * {@inheritDoc} */ @SuppressWarnings("unchecked") public <T1> T1[] toArray(final T1[] into) { final Class<?> componentType = into.getClass().getComponentType(); final int size = this.size; final T1[] arrayCopy = into.length >= size ? into : (T1[])Array.newInstance(componentType, size); copyValues(arrayCopy); return arrayCopy; } /** * {@inheritDoc} */ public Object[] toArray() { final Object[] arrayCopy = new Object[size]; copyValues(arrayCopy); return arrayCopy; } private void copyValues(final Object[] arrayCopy) { final ObjectIterator iterator = iterator(); for (int i = 0; iterator.hasNext(); i++) { arrayCopy[i] = iterator.next(); } } /** * {@inheritDoc} */ public boolean equals(final Object other) { if (other == this) { return true; } if (other instanceof ObjectHashSet) { final ObjectHashSet otherSet = (ObjectHashSet)other; return otherSet.size == size && containsAll(otherSet); } return false; } /** * {@inheritDoc} */ public int hashCode() { int hashCode = 0; for (final Object value : values) { if (value != MISSING_VALUE) { hashCode += value.hashCode(); } } return hashCode; } public final class ObjectHashSetIterator extends ObjectIterator<T> { ObjectHashSetIterator() { } @SuppressWarnings("unchecked") public void remove() { if (isPositionValid) { final int position = position(); values[position] = (T)MISSING_VALUE; --size; compactChain(position); isPositionValid = false; } else { throw new IllegalStateException(); } } } }